Spaces:
Running
Running
update
Browse files
app.py
CHANGED
@@ -217,7 +217,7 @@ with gr.Blocks(css="style.css") as demo:
|
|
217 |
|
218 |
user_input.change(tokenize_pair,
|
219 |
[user_input, tokenizer_type_1, tokenizer_type_2],
|
220 |
-
[output_text_1, output_table_1, output_text_2, output_table_2])
|
221 |
|
222 |
tokenizer_type_2.change(tokenize, [user_input, tokenizer_type_2],
|
223 |
[output_text_2, output_table_2])
|
|
|
217 |
|
218 |
user_input.change(tokenize_pair,
|
219 |
[user_input, tokenizer_type_1, tokenizer_type_2],
|
220 |
+
[output_text_1, output_table_1, output_text_2, output_table_2]) # , pass_request=1
|
221 |
|
222 |
tokenizer_type_2.change(tokenize, [user_input, tokenizer_type_2],
|
223 |
[output_text_2, output_table_2])
|
util.py
CHANGED
@@ -1,12 +1,13 @@
|
|
1 |
import gradio as gr
|
2 |
import json
|
|
|
3 |
import pandas as pd
|
4 |
from vocab import load_tokener
|
5 |
from utils.zh_util import iter_vocab
|
6 |
from utils.log_util import logger
|
7 |
|
8 |
|
9 |
-
def tokenize(text, tokenizer_type,
|
10 |
"""
|
11 |
TODO: cache tokenizer
|
12 |
"""
|
@@ -62,7 +63,16 @@ def tokenize(text, tokenizer_type, color_num=5, update=True):
|
|
62 |
return pos_tokens, table_df, len(encoding)
|
63 |
|
64 |
|
65 |
-
def tokenize_pair(text, tokenizer_type_1, tokenizer_type_2):
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
66 |
pos_tokens_1, table_df_1 = tokenize(text, tokenizer_type_1)
|
67 |
pos_tokens_2, table_df_2 = tokenize(text, tokenizer_type_2)
|
68 |
return pos_tokens_1, table_df_1, pos_tokens_2, table_df_2
|
|
|
1 |
import gradio as gr
|
2 |
import json
|
3 |
+
import socket
|
4 |
import pandas as pd
|
5 |
from vocab import load_tokener
|
6 |
from utils.zh_util import iter_vocab
|
7 |
from utils.log_util import logger
|
8 |
|
9 |
|
10 |
+
def tokenize(text, tokenizer_type, color_num=5, update=True):
|
11 |
"""
|
12 |
TODO: cache tokenizer
|
13 |
"""
|
|
|
63 |
return pos_tokens, table_df, len(encoding)
|
64 |
|
65 |
|
66 |
+
def tokenize_pair(text, tokenizer_type_1, tokenizer_type_2, request: gr.Request):
|
67 |
+
if request:
|
68 |
+
client_ip = request.client.host
|
69 |
+
# local_ip = socket.gethostbyname(socket.gethostbyname(""))
|
70 |
+
headers = request.kwargs['headers']
|
71 |
+
if headers and 'x-forwarded-for' in headers:
|
72 |
+
x_forwarded_for = headers['x-forwarded-for']
|
73 |
+
client_ip = x_forwarded_for.split(' ')[0] if x_forwarded_for else ""
|
74 |
+
logger.info("[client ip]", client_ip, tokenizer_type_1, tokenizer_type_2)
|
75 |
+
|
76 |
pos_tokens_1, table_df_1 = tokenize(text, tokenizer_type_1)
|
77 |
pos_tokens_2, table_df_2 = tokenize(text, tokenizer_type_2)
|
78 |
return pos_tokens_1, table_df_1, pos_tokens_2, table_df_2
|