Skip to content

Commit eba9baf

Browse files
committed
update hf_compare notebook
1 parent 578e5cc commit eba9baf

File tree

1 file changed

+53
-59
lines changed

1 file changed

+53
-59
lines changed

notebooks/hf_compare.ipynb

Lines changed: 53 additions & 59 deletions
Original file line numberDiff line numberDiff line change
@@ -187,7 +187,7 @@
187187
{
188188
"data": {
189189
"application/vnd.jupyter.widget-view+json": {
190-
"model_id": "2ffb58863ba0436296433ed981dc49db",
190+
"model_id": "e21c690b98854a098fc213c986cdae58",
191191
"version_major": 2,
192192
"version_minor": 0
193193
},
@@ -261,8 +261,8 @@
261261
" translated_texts = list()\n",
262262
" for batch in get_batches(texts,batch_size=model.generation_config.batch_size):\n",
263263
" translated_tokens = model.generate(\n",
264-
" top_k=10,\n",
265-
" top_p=0.75,\n",
264+
" top_k=100,\n",
265+
" top_p=0.8,\n",
266266
" do_sample=True,\n",
267267
" temperature=0.9,\n",
268268
" **tokenizer(batch, return_tensors=\"pt\",padding=True),\n",
@@ -279,7 +279,7 @@
279279
{
280280
"data": {
281281
"application/vnd.jupyter.widget-view+json": {
282-
"model_id": "876bf053074348b9822ecc814931ad2c",
282+
"model_id": "a27619cff1ed4b7bb054e45a9df98465",
283283
"version_major": 2,
284284
"version_minor": 0
285285
},
@@ -315,15 +315,15 @@
315315
{
316316
"data": {
317317
"text/plain": [
318-
"{'score': 18.35116938665859,\n",
319-
" 'counts': [129, 61, 33, 19],\n",
320-
" 'totals': [268, 258, 248, 239],\n",
321-
" 'precisions': [48.134328358208954,\n",
322-
" 23.643410852713178,\n",
323-
" 13.306451612903226,\n",
324-
" 7.949790794979079],\n",
325-
" 'bp': 0.9851854581626466,\n",
326-
" 'sys_len': 268,\n",
318+
"{'score': 16.432731874855403,\n",
319+
" 'counts': [132, 60, 31, 14],\n",
320+
" 'totals': [277, 267, 257, 248],\n",
321+
" 'precisions': [47.65342960288809,\n",
322+
" 22.471910112359552,\n",
323+
" 12.062256809338521,\n",
324+
" 5.645161290322581],\n",
325+
" 'bp': 1.0,\n",
326+
" 'sys_len': 277,\n",
327327
" 'ref_len': 272}"
328328
]
329329
},
@@ -377,7 +377,7 @@
377377
{
378378
"data": {
379379
"application/vnd.jupyter.widget-view+json": {
380-
"model_id": "73dd3bbe56c14f7e9f847e2f5afb780b",
380+
"model_id": "8d09a5ef6f15448295ee3a91e744e854",
381381
"version_major": 2,
382382
"version_minor": 0
383383
},
@@ -451,8 +451,8 @@
451451
" translated_texts = list()\n",
452452
" for batch in get_batches(texts,batch_size=model.generation_config.batch_size):\n",
453453
" translated_tokens = model.generate(\n",
454-
" top_k=10,\n",
455-
" top_p=0.75,\n",
454+
" top_k=100,\n",
455+
" top_p=0.8,\n",
456456
" num_beams=4,\n",
457457
" do_sample=True,\n",
458458
" temperature=0.9,\n",
@@ -471,7 +471,7 @@
471471
{
472472
"data": {
473473
"application/vnd.jupyter.widget-view+json": {
474-
"model_id": "266b195603364b3a9d407108b786065d",
474+
"model_id": "3ed5415206ab4e7db92c1f78ac4662a0",
475475
"version_major": 2,
476476
"version_minor": 0
477477
},
@@ -507,13 +507,13 @@
507507
{
508508
"data": {
509509
"text/plain": [
510-
"{'score': 21.323465966136123,\n",
511-
" 'counts': [134, 68, 41, 24],\n",
510+
"{'score': 21.792077490044267,\n",
511+
" 'counts': [135, 69, 42, 25],\n",
512512
" 'totals': [262, 252, 242, 233],\n",
513-
" 'precisions': [51.14503816793893,\n",
514-
" 26.984126984126984,\n",
515-
" 16.94214876033058,\n",
516-
" 10.300429184549357],\n",
513+
" 'precisions': [51.52671755725191,\n",
514+
" 27.38095238095238,\n",
515+
" 17.355371900826448,\n",
516+
" 10.729613733905579],\n",
517517
" 'bp': 0.9625512774839297,\n",
518518
" 'sys_len': 262,\n",
519519
" 'ref_len': 272}"
@@ -653,7 +653,7 @@
653653
{
654654
"data": {
655655
"application/vnd.jupyter.widget-view+json": {
656-
"model_id": "25ce4ae39bfc43b1a3fbd4c8fd83262e",
656+
"model_id": "d0101acb14924ebc9b74f899d1a28095",
657657
"version_major": 2,
658658
"version_minor": 0
659659
},
@@ -719,16 +719,16 @@
719719
},
720720
{
721721
"cell_type": "code",
722-
"execution_count": 24,
722+
"execution_count": 36,
723723
"metadata": {},
724724
"outputs": [],
725725
"source": [
726726
"greedy_sequences_generator = GreedyGenerator(\n",
727727
" use_tqdm=True,\n",
728728
" temperature=0.9,\n",
729-
" top_k_sampling=10,\n",
730729
" sort_samples=True,\n",
731-
" top_p_sampling=0.75,\n",
730+
" top_k_sampling=100,\n",
731+
" top_p_sampling=0.8,\n",
732732
" device=model.device,\n",
733733
" multinomial_sampling=True,\n",
734734
" generation_forward=generate,\n",
@@ -741,13 +741,13 @@
741741
},
742742
{
743743
"cell_type": "code",
744-
"execution_count": 25,
744+
"execution_count": 37,
745745
"metadata": {},
746746
"outputs": [
747747
{
748748
"data": {
749749
"application/vnd.jupyter.widget-view+json": {
750-
"model_id": "cf2eef68941942f5aade85c0567aa0d2",
750+
"model_id": "e2c36cc8e29a4cd6bca9f30164f0a071",
751751
"version_major": 2,
752752
"version_minor": 0
753753
},
@@ -764,7 +764,7 @@
764764
"(10, 10, 10)"
765765
]
766766
},
767-
"execution_count": 25,
767+
"execution_count": 37,
768768
"metadata": {},
769769
"output_type": "execute_result"
770770
}
@@ -777,25 +777,22 @@
777777
},
778778
{
779779
"cell_type": "code",
780-
"execution_count": 26,
780+
"execution_count": 38,
781781
"metadata": {},
782782
"outputs": [
783783
{
784784
"data": {
785785
"text/plain": [
786-
"{'score': 9.729423488181931,\n",
787-
" 'counts': [109, 47, 19, 4],\n",
788-
" 'totals': [266, 256, 246, 237],\n",
789-
" 'precisions': [40.97744360902256,\n",
790-
" 18.359375,\n",
791-
" 7.723577235772358,\n",
792-
" 1.6877637130801688],\n",
793-
" 'bp': 0.9776961023999414,\n",
794-
" 'sys_len': 266,\n",
786+
"{'score': 16.963549254009152,\n",
787+
" 'counts': [133, 61, 31, 16],\n",
788+
" 'totals': [279, 269, 259, 250],\n",
789+
" 'precisions': [47.67025089605735, 22.676579925650557, 11.96911196911197, 6.4],\n",
790+
" 'bp': 1.0,\n",
791+
" 'sys_len': 279,\n",
795792
" 'ref_len': 272}"
796793
]
797794
},
798-
"execution_count": 26,
795+
"execution_count": 38,
799796
"metadata": {},
800797
"output_type": "execute_result"
801798
}
@@ -839,7 +836,7 @@
839836
{
840837
"data": {
841838
"application/vnd.jupyter.widget-view+json": {
842-
"model_id": "5eef67a1e84e4349a17cc22558cced89",
839+
"model_id": "ce3f41dcd2344d669478305a523a112d",
843840
"version_major": 2,
844841
"version_minor": 0
845842
},
@@ -905,7 +902,7 @@
905902
},
906903
{
907904
"cell_type": "code",
908-
"execution_count": 30,
905+
"execution_count": 33,
909906
"metadata": {},
910907
"outputs": [],
911908
"source": [
@@ -914,9 +911,9 @@
914911
" use_tqdm=True,\n",
915912
" temperature=0.9,\n",
916913
" sort_samples=True,\n",
917-
" top_k_sampling=10,\n",
914+
" top_k_sampling=100,\n",
918915
" length_penalty=0.6,\n",
919-
" top_p_sampling=0.75,\n",
916+
" top_p_sampling=0.8,\n",
920917
" device=model.device,\n",
921918
" multinomial_sampling=True,\n",
922919
" generation_forward=generate,\n",
@@ -929,13 +926,13 @@
929926
},
930927
{
931928
"cell_type": "code",
932-
"execution_count": 31,
929+
"execution_count": 34,
933930
"metadata": {},
934931
"outputs": [
935932
{
936933
"data": {
937934
"application/vnd.jupyter.widget-view+json": {
938-
"model_id": "3605ce4f5720498c911d50be793b674f",
935+
"model_id": "eb933bc8db5f4efc9491dfecb620c4e0",
939936
"version_major": 2,
940937
"version_minor": 0
941938
},
@@ -952,7 +949,7 @@
952949
"(10, 10, 10)"
953950
]
954951
},
955-
"execution_count": 31,
952+
"execution_count": 34,
956953
"metadata": {},
957954
"output_type": "execute_result"
958955
}
@@ -965,25 +962,22 @@
965962
},
966963
{
967964
"cell_type": "code",
968-
"execution_count": 32,
965+
"execution_count": 35,
969966
"metadata": {},
970967
"outputs": [
971968
{
972969
"data": {
973970
"text/plain": [
974-
"{'score': 20.27713611022614,\n",
975-
" 'counts': [135, 68, 38, 21],\n",
976-
" 'totals': [259, 249, 239, 230],\n",
977-
" 'precisions': [52.12355212355212,\n",
978-
" 27.309236947791163,\n",
979-
" 15.899581589958158,\n",
980-
" 9.130434782608695],\n",
981-
" 'bp': 0.951045807200927,\n",
982-
" 'sys_len': 259,\n",
971+
"{'score': 20.760619867696708,\n",
972+
" 'counts': [136, 69, 39, 22],\n",
973+
" 'totals': [260, 250, 240, 231],\n",
974+
" 'precisions': [52.30769230769231, 27.6, 16.25, 9.523809523809524],\n",
975+
" 'bp': 0.954895043959762,\n",
976+
" 'sys_len': 260,\n",
983977
" 'ref_len': 272}"
984978
]
985979
},
986-
"execution_count": 32,
980+
"execution_count": 35,
987981
"metadata": {},
988982
"output_type": "execute_result"
989983
}

0 commit comments

Comments
 (0)