Commit c156c1f
Parent(s): c41577c

Add liger-kernel dependency and update model files

Files changed:
- app.py           +10 -1
- requirements.txt  +1 -0
- tokenizer.py     +12 -1
app.py CHANGED

@@ -55,7 +55,16 @@ def initialize_app():
         print("Tokenizer initialized successfully")
     except Exception as e:
         print(f"Error initializing tokenizer: {e}")
-
+        print("This might be due to missing HF_TOKEN or lack of access to gated models.")
+        print("The app will try to use a fallback tokenizer.")
+        # Don't raise the error, let the tokenizer handle fallback
+        try:
+            tk = Tokenizer(hf_token=None)  # Force fallback
+            tk = tk.ready_tokenizer()
+            print("Fallback tokenizer initialized successfully")
+        except Exception as fallback_error:
+            print(f"Fallback tokenizer also failed: {fallback_error}")
+            raise fallback_error
 
     # Initialize the global tokenizer in model.py
     initialize_tokenizer(hf_token=hf_token)
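The hunk above shows only the error path. Below is a minimal sketch of how initialize_app() reads after this commit; only the except branch is taken verbatim from the hunk, while the enclosing try block and the model.py import are inferred from context and not shown in the diff:

# Reconstructed sketch of initialize_app() after this commit; the happy path
# and the import of initialize_tokenizer are assumptions, not from the diff.
from tokenizer import Tokenizer
from model import initialize_tokenizer  # inferred: the comment says "in model.py"

def initialize_app(hf_token=None):
    try:
        tk = Tokenizer(hf_token=hf_token)
        tk = tk.ready_tokenizer()
        print("Tokenizer initialized successfully")
    except Exception as e:
        print(f"Error initializing tokenizer: {e}")
        print("This might be due to missing HF_TOKEN or lack of access to gated models.")
        print("The app will try to use a fallback tokenizer.")
        # Don't raise the error, let the tokenizer handle fallback
        try:
            tk = Tokenizer(hf_token=None)  # Force fallback
            tk = tk.ready_tokenizer()
            print("Fallback tokenizer initialized successfully")
        except Exception as fallback_error:
            print(f"Fallback tokenizer also failed: {fallback_error}")
            raise fallback_error

    # Initialize the global tokenizer in model.py
    initialize_tokenizer(hf_token=hf_token)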
requirements.txt CHANGED

@@ -7,3 +7,4 @@ huggingface_hub
 gradio
 numpy
 safetensors
+liger-kernel
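liger-kernel provides fused Triton kernels for common transformer layers (RMSNorm, RoPE, SwiGLU, fused cross-entropy). This commit only adds the dependency; the diff does not show where it is wired in. A minimal sketch of typical usage, assuming the library's standard liger_kernel.transformers patching API rather than anything from this repo:

# Hypothetical usage; not taken from this repo. apply_liger_kernel_to_llama()
# monkey-patches transformers' Llama modules with Liger's fused Triton kernels,
# so it should run before the model is instantiated.
from liger_kernel.transformers import apply_liger_kernel_to_llama
from transformers import AutoModelForCausalLM

apply_liger_kernel_to_llama()
model = AutoModelForCausalLM.from_pretrained("meta-llama/Llama-2-7b-hf")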
tokenizer.py CHANGED

@@ -9,8 +9,19 @@ class Tokenizer:
             print(f"[INFO] Using HF token for model access")
         else:
             print("[INFO] No HF token provided - using public models only")
+
+        # Use a public tokenizer instead of gated Llama model
+        # GPT-2 tokenizer is widely compatible and doesn't require authentication
+        try:
+            if hf_token:
+                # Try Llama tokenizer first if we have a token
+                self.tokenizer = AutoTokenizer.from_pretrained("meta-llama/Llama-2-7b-hf", token=hf_token)
+            else:
+                raise Exception("No token - using fallback")
+        except:
+            print("[INFO] Fallback to public GPT-2 tokenizer")
+            self.tokenizer = AutoTokenizer.from_pretrained("gpt2")
 
-        self.tokenizer = AutoTokenizer.from_pretrained("meta-llama/Llama-2-7b-hf", token=hf_token)
         self.tokenizer.add_special_tokens({'pad_token': '[PAD]'})
 
     def ready_tokenizer(self):
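A quick usage sketch of the fallback behaviour added above, assuming ready_tokenizer() returns the wrapped Hugging Face tokenizer (its body is not shown in this hunk):

# Exercising the no-token path; the [INFO] strings match the prints in the diff.
from tokenizer import Tokenizer

tk = Tokenizer(hf_token=None)     # prints "[INFO] Fallback to public GPT-2 tokenizer"
tokenizer = tk.ready_tokenizer()  # assumed to return self.tokenizer
print(tokenizer.pad_token)        # '[PAD]', added via add_special_tokens

One design note: the bare except: is load-bearing here, since the no-token branch signals the fallback by raising a plain Exception; narrowing it to, say, OSError would require changing that raise as well.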