Addressing comments

1d391bba · rprenger · b0c824d9 · 1d391bba · 1d391bba
Commit 1d391bba authored Feb 10, 2022 by rprenger
Hide whitespace changes
Inline Side-by-side

Showing with 17 additions and 0 deletions

megatron/static/index.html megatron/static/index.html +15 -0

megatron/text_generation/generation.py megatron/text_generation/generation.py +2 -0

No files found.
--- a/megatron/static/index.html
+++ b/megatron/static/index.html
+<!-- coding=utf-8-->
+<!-- Copyright (c) 2020, NVIDIA CORPORATION.  All rights reserved.-->
+<!---->
+<!-- Licensed under the Apache License, Version 2.0 (the "License");-->
+<!-- you may not use this file except in compliance with the License.-->
+<!-- You may obtain a copy of the License at-->
+<!---->
+<!--     http://www.apache.org/licenses/LICENSE-2.0-->
+<!---->
+<!-- Unless required by applicable law or agreed to in writing, software-->
+<!-- distributed under the License is distributed on an "AS IS" BASIS,-->
+<!-- WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.-->
+<!-- See the License for the specific language governing permissions and-->
+<!-- limitations under the License.-->
+
 <!DOCTYPE html>
 <html lang="en">
 <head>

--- a/megatron/text_generation/generation.py
+++ b/megatron/text_generation/generation.py
@@ -234,6 +234,8 @@ def generate_tokens_probs_and_return_on_first_stage(
            # Check if all the sequences have hit the termination_id.
            done = None
            if mpu.is_pipeline_last_stage():
+                # TODO(rprenger): These stopping methods are tokenizer-dependent;
+                # instead, tokenization should be in the inference loop so stop sequences can be used.
                if stop_on_double_eol:
                    hit_double_eol = (new_sample == 628).byte() & started.byte()
                    hit_two_eols = (new_sample == 198).byte() & (tokens[:, context_length-1] == 198).byte() & started.byte()