Spaces:
Sleeping
Sleeping
app modified dataset reorden token
Browse files
app.py
CHANGED
@@ -364,7 +364,24 @@ class ModeloDataset:
|
|
364 |
i=i+1
|
365 |
labels = predicted_token_class_ids
|
366 |
loss = self.model(input_ids, labels=labels).loss
|
367 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
368 |
else:
|
369 |
|
370 |
print('idioma:',idioma)
|
|
|
364 |
i=i+1
|
365 |
labels = predicted_token_class_ids
|
366 |
loss = self.model(input_ids, labels=labels).loss
|
367 |
+
|
368 |
+
new_tokens=[]
|
369 |
+
ig_tok=[]
|
370 |
+
i=0
|
371 |
+
new_identificadores=[]
|
372 |
+
for item in tokenized_text:
|
373 |
+
|
374 |
+
aux1, aux2= self.reordenacion_tokens(item,"_")
|
375 |
+
new_tokens.append(aux1)
|
376 |
+
ig_tok.append(aux2)
|
377 |
+
|
378 |
+
|
379 |
+
for items in _predicted_tokens_classes:
|
380 |
+
aux=self.reordenacion_identificadores(ig_tok[i],items,len(new_tokens[i]))
|
381 |
+
new_identificadores.append(aux)
|
382 |
+
i=i+1
|
383 |
+
|
384 |
+
return new_identificadores, new_tokens#ids,_predicted_tokens_classes
|
385 |
else:
|
386 |
|
387 |
print('idioma:',idioma)
|