Spaces:

masanorihirano
/

plamo-2-1b

Running

masanorihirano committed on Feb 12

Commit

77f7edf

verified ·

1 Parent(s): 53f0151

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -79,7 +79,7 @@ class ThreadManager:
 def respond(prompt, max_tokens):
-    print(prompt)
     streamer = TextIteratorStreamer(
         tokenizer, skip_prompt=True, skip_special_tokens=True
@@ -104,7 +104,7 @@ def respond(prompt, max_tokens):
         for output in streamer:
             if not output:
                 continue
-            print(output)
             response += output
             yield response, gr.update(interactive=False), gr.update(interactive=False),
         yield (
@@ -125,7 +125,7 @@ def no_interactive():
 with gr.Blocks() as demo:
     gr.HTML("""<h1 align="center">plamo-2-1b CPU demo</h1>""")
     gr.Markdown(
-        "2 vCPU, 16 GB RAMでのデモです。5年前くらいのノートパソコンくらい。(GPUなしのHF中国镜像站の無料インスタンスで動いています。)vllmとかllama.cppが対応すればもっと高速に動くはず。"
     )
     with gr.Column(elem_id="col_container") as main_block:
         with gr.Row():

 def respond(prompt, max_tokens):
+    # print(prompt)
     streamer = TextIteratorStreamer(
         tokenizer, skip_prompt=True, skip_special_tokens=True
         for output in streamer:
             if not output:
                 continue
+            # print(output)
             response += output
             yield response, gr.update(interactive=False), gr.update(interactive=False),
         yield (
 with gr.Blocks() as demo:
     gr.HTML("""<h1 align="center">plamo-2-1b CPU demo</h1>""")
     gr.Markdown(
+        "2 vCPU, 16 GB RAMでのデモです。10年前くらいのノートパソコンくらい。(GPUなしのHF中国镜像站の無料インスタンスで動いています。)vllmとかllama.cppが対応すればもっと高速に動くはず。"
     )
     with gr.Column(elem_id="col_container") as main_block:
         with gr.Row():