Spaces:
Runtime error
Runtime error
fix bug, reduce memory footprint
Browse files
app.py
CHANGED
|
@@ -21,8 +21,9 @@ def sanitize_jinja2(jinja_lines):
|
|
| 21 |
def get_existing_templates():
|
| 22 |
return [None] + os.listdir("./templates")
|
| 23 |
|
| 24 |
-
if
|
| 25 |
-
|
|
|
|
| 26 |
|
| 27 |
# Initialization
|
| 28 |
if 'tokenizer_json' not in st.session_state:
|
|
@@ -83,12 +84,14 @@ if gen_button:
|
|
| 83 |
st.session_state['tokenizer'] = AutoTokenizer.from_pretrained(hf_model_repo_name)
|
| 84 |
|
| 85 |
st.session_state['repo_normalized_name'] = hf_model_repo_name.replace("/", "_")
|
| 86 |
-
st.session_state['tokenizer'].save_pretrained(f"./tmp/{st.session_state['uuid']}_{hf_model_repo_name}")
|
| 87 |
st.session_state['tokenizer_json'] = f"./tmp/{st.session_state['uuid']}_{hf_model_repo_name}"
|
|
|
|
| 88 |
|
| 89 |
if st.session_state['tokenizer_json'] is not None:
|
|
|
|
| 90 |
with open(f"{st.session_state['tokenizer_json']}/tokenizer_config.json", "rb") as f:
|
| 91 |
tokenizer_json = json.load(f)
|
|
|
|
| 92 |
|
| 93 |
json_spec, col2 = st.columns(spec=[0.3, 0.7])
|
| 94 |
|
|
@@ -146,6 +149,7 @@ if st.session_state['tokenizer_json'] is not None:
|
|
| 146 |
with open(f"./tmp/{st.session_state['uuid']}/tmp_chat_template.json", "r") as f:
|
| 147 |
jinja_lines = f.readlines()
|
| 148 |
st.session_state['tokenizer'].chat_template = sanitize_jinja2(jinja_lines)
|
|
|
|
| 149 |
generated_prompt_wo_add_generation_prompt = st.session_state['tokenizer'].apply_chat_template(chat, tokenize=False, add_generation_prompt= False)
|
| 150 |
generated_prompt_w_add_generation_prompt = st.session_state['tokenizer'].apply_chat_template(chat, tokenize=False, add_generation_prompt= True)
|
| 151 |
|
|
@@ -166,10 +170,11 @@ if st.session_state['tokenizer_json'] is not None:
|
|
| 166 |
to_private_checkbox = st.checkbox("To Private Repo", key="to_private_checkbox")
|
| 167 |
create_pr_checkbox = st.checkbox("Create PR (For Contribution 🤗)", key="create_pr_checkbox")
|
| 168 |
push_to_hub_button = st.button("Push to Hub", key="push_to_hub_button", use_container_width=True)
|
| 169 |
-
st.session_state['tokenizer'].save_pretrained(
|
| 170 |
-
with open(f"
|
| 171 |
|
| 172 |
tokenizer_config_content = json.loads(f.read())
|
|
|
|
| 173 |
|
| 174 |
st.download_button(
|
| 175 |
label="Download tokenizer_config.json",
|
|
@@ -195,3 +200,4 @@ if st.session_state['tokenizer_json'] is not None:
|
|
| 195 |
except Exception as e:
|
| 196 |
st.write(f"Repo id: {st.session_state['repo_id']}")
|
| 197 |
st.write(str(e))
|
|
|
|
|
|
| 21 |
def get_existing_templates():
|
| 22 |
return [None] + os.listdir("./templates")
|
| 23 |
|
| 24 |
+
# if os.path.exists("./tmp"):
|
| 25 |
+
# if len(os.listdir("./tmp")) > 20:
|
| 26 |
+
# shutil.rmtree('./tmp')
|
| 27 |
|
| 28 |
# Initialization
|
| 29 |
if 'tokenizer_json' not in st.session_state:
|
|
|
|
| 84 |
st.session_state['tokenizer'] = AutoTokenizer.from_pretrained(hf_model_repo_name)
|
| 85 |
|
| 86 |
st.session_state['repo_normalized_name'] = hf_model_repo_name.replace("/", "_")
|
|
|
|
| 87 |
st.session_state['tokenizer_json'] = f"./tmp/{st.session_state['uuid']}_{hf_model_repo_name}"
|
| 88 |
+
# st.session_state['tokenizer'].save_pretrained(st.session_state['tokenizer_json'])
|
| 89 |
|
| 90 |
if st.session_state['tokenizer_json'] is not None:
|
| 91 |
+
st.session_state['tokenizer'].save_pretrained(st.session_state['tokenizer_json'])
|
| 92 |
with open(f"{st.session_state['tokenizer_json']}/tokenizer_config.json", "rb") as f:
|
| 93 |
tokenizer_json = json.load(f)
|
| 94 |
+
shutil.rmtree(st.session_state['tokenizer_json'])
|
| 95 |
|
| 96 |
json_spec, col2 = st.columns(spec=[0.3, 0.7])
|
| 97 |
|
|
|
|
| 149 |
with open(f"./tmp/{st.session_state['uuid']}/tmp_chat_template.json", "r") as f:
|
| 150 |
jinja_lines = f.readlines()
|
| 151 |
st.session_state['tokenizer'].chat_template = sanitize_jinja2(jinja_lines)
|
| 152 |
+
os.remove(f"./tmp/{st.session_state['uuid']}/tmp_chat_template.json")
|
| 153 |
generated_prompt_wo_add_generation_prompt = st.session_state['tokenizer'].apply_chat_template(chat, tokenize=False, add_generation_prompt= False)
|
| 154 |
generated_prompt_w_add_generation_prompt = st.session_state['tokenizer'].apply_chat_template(chat, tokenize=False, add_generation_prompt= True)
|
| 155 |
|
|
|
|
| 170 |
to_private_checkbox = st.checkbox("To Private Repo", key="to_private_checkbox")
|
| 171 |
create_pr_checkbox = st.checkbox("Create PR (For Contribution 🤗)", key="create_pr_checkbox")
|
| 172 |
push_to_hub_button = st.button("Push to Hub", key="push_to_hub_button", use_container_width=True)
|
| 173 |
+
st.session_state['tokenizer'].save_pretrained(st.session_state['tokenizer_json'])
|
| 174 |
+
with open(f"{st.session_state['tokenizer_json']}/tokenizer_config.json", "r") as f:
|
| 175 |
|
| 176 |
tokenizer_config_content = json.loads(f.read())
|
| 177 |
+
shutil.rmtree(st.session_state['tokenizer_json'])
|
| 178 |
|
| 179 |
st.download_button(
|
| 180 |
label="Download tokenizer_config.json",
|
|
|
|
| 200 |
except Exception as e:
|
| 201 |
st.write(f"Repo id: {st.session_state['repo_id']}")
|
| 202 |
st.write(str(e))
|
| 203 |
+
os.remove(f"./tmp/{st.session_state['uuid']}/tmp_chat_template.json")
|