Spaces:
Runtime error
Runtime error
pseudotensor
committed on
Commit
·
3035e40
1
Parent(s):
1c674f6
Update with h2oGPT hash c86dd3b6ef211cef2f99ece2714de09c03e1c490
Browse files
- app.py +25 -11
- client_test.py +1 -1
- finetune.py +1 -3
- requirements.txt +4 -2
- utils.py +33 -1
app.py
CHANGED
@@ -4,7 +4,7 @@ import sys
|
|
4 |
import os
|
5 |
import traceback
|
6 |
import typing
|
7 |
-
from utils import set_seed, flatten_list, clear_torch_cache, system_info_print, zip_data, save_generate_output
|
8 |
|
9 |
SEED = 1236
|
10 |
set_seed(SEED)
|
@@ -556,6 +556,7 @@ def go_gradio(**kwargs):
|
|
556 |
else:
|
557 |
description = "For more information, visit [the project's website](https://github.com/h2oai/h2ogpt).<br>"
|
558 |
if is_public:
|
|
|
559 |
description += """<p><b> DISCLAIMERS: </b><ul><i><li>The model was trained on The Pile and other data, which may contain objectionable content. Use at own risk.</i></li>"""
|
560 |
if kwargs['load_8bit']:
|
561 |
description += """<i><li> Model is loaded in 8-bit and has other restrictions on this host. UX can be worse than non-hosted version.</i></li>"""
|
@@ -891,25 +892,38 @@ body.dark{background:linear-gradient(#0d0d0d,#333333);}"""
|
|
891 |
lora_used2 = gr.Textbox(label="Current LORA 2", value=no_lora_str,
|
892 |
visible=kwargs['show_lora'])
|
893 |
with gr.TabItem("System"):
|
|
|
|
|
|
|
|
|
894 |
system_row = gr.Row(visible=not is_public)
|
895 |
-
admin_pass_textbox = gr.Textbox(label="Admin Password", type='password', visible=is_public)
|
896 |
-
admin_btn = gr.Button(value="admin", visible=is_public)
|
897 |
with system_row:
|
898 |
with gr.Column():
|
899 |
-
|
900 |
-
|
901 |
-
|
902 |
-
|
903 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
904 |
|
905 |
# Get flagged data
|
906 |
zip_data1 = functools.partial(zip_data, root_dirs=['flagged_data_points', kwargs['save_dir']])
|
907 |
-
zip_btn.click(zip_data1, inputs=None, outputs=file_output)
|
|
|
908 |
|
909 |
def check_admin_pass(x):
|
910 |
return gr.update(visible=x == admin_pass)
|
911 |
|
912 |
-
|
|
|
|
|
|
|
|
|
913 |
|
914 |
# Get inputs to evaluate()
|
915 |
inputs_list = get_inputs_list(locals(), kwargs['model_lower'])
|
@@ -1953,7 +1967,7 @@ if __name__ == "__main__":
|
|
1953 |
can also pass --prompt_type='human_bot' and model can somewhat handle instructions without being instruct tuned
|
1954 |
python generate.py --base_model=decapoda-research/llama-65b-hf --load_8bit=False --infer_devices=False --prompt_type='human_bot'
|
1955 |
|
1956 |
-
python generate.py --base_model=h2oai/h2ogpt-oig-oasst1-
|
1957 |
|
1958 |
""", flush=True)
|
1959 |
fire.Fire(main)
|
|
|
4 |
import os
|
5 |
import traceback
|
6 |
import typing
|
7 |
+
from utils import set_seed, flatten_list, clear_torch_cache, system_info_print, zip_data, save_generate_output, s3up
|
8 |
|
9 |
SEED = 1236
|
10 |
set_seed(SEED)
|
|
|
556 |
else:
|
557 |
description = "For more information, visit [the project's website](https://github.com/h2oai/h2ogpt).<br>"
|
558 |
if is_public:
|
559 |
+
description += "If this host is busy, try [20B](gpt.h2o.ai) and [Chatbot1 12B](https://huggingface.co/spaces/h2oai/h2ogpt-chatbot) and [Chatbot2 12B](https://huggingface.co/spaces/h2oai/h2ogpt-chatbot2)<br>"
|
560 |
description += """<p><b> DISCLAIMERS: </b><ul><i><li>The model was trained on The Pile and other data, which may contain objectionable content. Use at own risk.</i></li>"""
|
561 |
if kwargs['load_8bit']:
|
562 |
description += """<i><li> Model is loaded in 8-bit and has other restrictions on this host. UX can be worse than non-hosted version.</i></li>"""
|
|
|
892 |
lora_used2 = gr.Textbox(label="Current LORA 2", value=no_lora_str,
|
893 |
visible=kwargs['show_lora'])
|
894 |
with gr.TabItem("System"):
|
895 |
+
admin_row = gr.Row()
|
896 |
+
with admin_row:
|
897 |
+
admin_pass_textbox = gr.Textbox(label="Admin Password", type='password', visible=is_public)
|
898 |
+
admin_btn = gr.Button(value="Admin Access", visible=is_public)
|
899 |
system_row = gr.Row(visible=not is_public)
|
|
|
|
|
900 |
with system_row:
|
901 |
with gr.Column():
|
902 |
+
with gr.Row():
|
903 |
+
system_btn = gr.Button(value='Get System Info')
|
904 |
+
system_text = gr.Textbox(label='System Info')
|
905 |
+
|
906 |
+
with gr.Row():
|
907 |
+
zip_btn = gr.Button("Zip")
|
908 |
+
zip_text = gr.Textbox(label="Zip file name")
|
909 |
+
file_output = gr.File()
|
910 |
+
with gr.Row():
|
911 |
+
s3up_btn = gr.Button("S3UP")
|
912 |
+
s3up_text = gr.Textbox(label='S3UP result')
|
913 |
|
914 |
# Get flagged data
|
915 |
zip_data1 = functools.partial(zip_data, root_dirs=['flagged_data_points', kwargs['save_dir']])
|
916 |
+
zip_btn.click(zip_data1, inputs=None, outputs=[file_output, zip_text])
|
917 |
+
s3up_btn.click(s3up, inputs=zip_text, outputs=s3up_text)
|
918 |
|
919 |
def check_admin_pass(x):
|
920 |
return gr.update(visible=x == admin_pass)
|
921 |
|
922 |
+
def close_admin(x):
|
923 |
+
return gr.update(visible=not (x == admin_pass))
|
924 |
+
|
925 |
+
admin_btn.click(check_admin_pass, inputs=admin_pass_textbox, outputs=system_row) \
|
926 |
+
.then(close_admin, inputs=admin_pass_textbox, outputs=admin_row)
|
927 |
|
928 |
# Get inputs to evaluate()
|
929 |
inputs_list = get_inputs_list(locals(), kwargs['model_lower'])
|
|
|
1967 |
can also pass --prompt_type='human_bot' and model can somewhat handle instructions without being instruct tuned
|
1968 |
python generate.py --base_model=decapoda-research/llama-65b-hf --load_8bit=False --infer_devices=False --prompt_type='human_bot'
|
1969 |
|
1970 |
+
python generate.py --base_model=h2oai/h2ogpt-oig-oasst1-512-6.9b
|
1971 |
|
1972 |
""", flush=True)
|
1973 |
fire.Fire(main)
|
client_test.py
CHANGED
@@ -3,7 +3,7 @@ Client test.
|
|
3 |
|
4 |
Run server:
|
5 |
|
6 |
-
python generate.py --base_model=h2oai/h2ogpt-oig-oasst1-
|
7 |
|
8 |
NOTE: For private models, add --use-auth_token=True
|
9 |
|
|
|
3 |
|
4 |
Run server:
|
5 |
|
6 |
+
python generate.py --base_model=h2oai/h2ogpt-oig-oasst1-512-6.9b
|
7 |
|
8 |
NOTE: For private models, add --use-auth_token=True
|
9 |
|
finetune.py
CHANGED
@@ -84,11 +84,9 @@ prompt_type_to_model_name = {
|
|
84 |
'instruct_with_end': ['databricks/dolly-v2-12b'],
|
85 |
'quality': [],
|
86 |
'human_bot': [
|
87 |
-
'h2oai/h2ogpt-oig-oasst1-256-12b',
|
88 |
'h2oai/h2ogpt-oasst1-512-12b',
|
89 |
-
'h2oai/h2ogpt-oasst1-256-20b',
|
90 |
'h2oai/h2ogpt-oasst1-512-20b',
|
91 |
-
'h2oai/h2ogpt-oig-oasst1-
|
92 |
],
|
93 |
'dai_faq': [],
|
94 |
'summarize': [],
|
|
|
84 |
'instruct_with_end': ['databricks/dolly-v2-12b'],
|
85 |
'quality': [],
|
86 |
'human_bot': [
|
|
|
87 |
'h2oai/h2ogpt-oasst1-512-12b',
|
|
|
88 |
'h2oai/h2ogpt-oasst1-512-20b',
|
89 |
+
'h2oai/h2ogpt-oig-oasst1-512-6.9b',
|
90 |
],
|
91 |
'dai_faq': [],
|
92 |
'summarize': [],
|
requirements.txt
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
# for generate (gradio server) and finetune
|
2 |
-
datasets==2.
|
3 |
sentencepiece==0.1.97
|
4 |
accelerate==0.18.0
|
5 |
gradio==3.27.0
|
@@ -15,7 +15,7 @@ scikit-learn==1.2.2
|
|
15 |
alt-profanity-check==1.2.2
|
16 |
better-profanity==0.6.1
|
17 |
numpy==1.24.2
|
18 |
-
pandas==
|
19 |
matplotlib==3.7.1
|
20 |
loralib==0.1.1
|
21 |
bitsandbytes==0.38.1
|
@@ -26,6 +26,8 @@ tokenizers==0.13.3
|
|
26 |
# optional for generate
|
27 |
pynvml==11.5.0
|
28 |
psutil==5.9.4
|
|
|
|
|
29 |
|
30 |
# optional for finetune
|
31 |
tensorboard==2.12.1
|
|
|
1 |
# for generate (gradio server) and finetune
|
2 |
+
datasets==2.11.0
|
3 |
sentencepiece==0.1.97
|
4 |
accelerate==0.18.0
|
5 |
gradio==3.27.0
|
|
|
15 |
alt-profanity-check==1.2.2
|
16 |
better-profanity==0.6.1
|
17 |
numpy==1.24.2
|
18 |
+
pandas==2.0.0
|
19 |
matplotlib==3.7.1
|
20 |
loralib==0.1.1
|
21 |
bitsandbytes==0.38.1
|
|
|
26 |
# optional for generate
|
27 |
pynvml==11.5.0
|
28 |
psutil==5.9.4
|
29 |
+
boto3==1.26.101
|
30 |
+
botocore==1.29.101
|
31 |
|
32 |
# optional for finetune
|
33 |
tensorboard==2.12.1
|
utils.py
CHANGED
@@ -118,7 +118,7 @@ def _zip_data(root_dirs=None, zip_file=None, base_dir='./'):
|
|
118 |
assert os.path.exists(file_to_archive)
|
119 |
path_to_archive = os.path.relpath(file_to_archive, base_dir)
|
120 |
expt_zip.write(filename=file_to_archive, arcname=path_to_archive)
|
121 |
-
return zip_file
|
122 |
|
123 |
|
124 |
def save_generate_output(output=None, base_model=None, save_dir=None):
|
@@ -152,3 +152,35 @@ def _save_generate_output(output=None, base_model=None, save_dir=None):
|
|
152 |
dict(text=output, time=time.ctime(), base_model=base_model)
|
153 |
) + ",\n"
|
154 |
)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
118 |
assert os.path.exists(file_to_archive)
|
119 |
path_to_archive = os.path.relpath(file_to_archive, base_dir)
|
120 |
expt_zip.write(filename=file_to_archive, arcname=path_to_archive)
|
121 |
+
return zip_file, zip_file
|
122 |
|
123 |
|
124 |
def save_generate_output(output=None, base_model=None, save_dir=None):
|
|
|
152 |
dict(text=output, time=time.ctime(), base_model=base_model)
|
153 |
) + ",\n"
|
154 |
)
|
155 |
+
|
156 |
+
|
157 |
+
def s3up(filename):
|
158 |
+
try:
|
159 |
+
return _s3up(filename)
|
160 |
+
except Exception as e:
|
161 |
+
traceback.print_exc()
|
162 |
+
print('Exception for file %s in s3up: %s' % (filename, str(e)))
|
163 |
+
return "Failed to upload %s: Error: %s" % (filename, str(e))
|
164 |
+
|
165 |
+
|
166 |
+
def _s3up(filename):
|
167 |
+
import boto3
|
168 |
+
|
169 |
+
aws_access_key_id = os.getenv('AWS_SERVER_PUBLIC_KEY')
|
170 |
+
aws_secret_access_key = os.getenv('AWS_SERVER_SECRET_KEY')
|
171 |
+
bucket = os.getenv('AWS_BUCKET')
|
172 |
+
assert aws_access_key_id, "Set AWS key"
|
173 |
+
assert aws_secret_access_key, "Set AWS secret"
|
174 |
+
assert bucket, "Set AWS Bucket"
|
175 |
+
|
176 |
+
s3 = boto3.client('s3',
|
177 |
+
aws_access_key_id=os.getenv('AWS_SERVER_PUBLIC_KEY'),
|
178 |
+
aws_secret_access_key=os.getenv('AWS_SERVER_SECRET_KEY'),
|
179 |
+
)
|
180 |
+
ret = s3.upload_file(
|
181 |
+
Filename=filename,
|
182 |
+
Bucket=os.getenv('AWS_BUCKET'),
|
183 |
+
Key=filename,
|
184 |
+
)
|
185 |
+
if ret in [None, '']:
|
186 |
+
return "Successfully uploaded %s" % filename
|