Woao committed on Jun 5, 2024

Commit

7afa3ee

verified ·

1 Parent(s): 3f3b557

Upload folder using huggingface_hub

Browse files

Files changed (18) hide show

README.md +36 -0
checkpoint-2331/config.json +44 -0
checkpoint-2331/model.safetensors +3 -0
checkpoint-2331/optimizer.pt +3 -0
checkpoint-2331/rng_state.pth +3 -0
checkpoint-2331/scheduler.pt +3 -0
checkpoint-2331/trainer_state.json +747 -0
checkpoint-2331/training_args.bin +3 -0
config.json +44 -0
model.safetensors +3 -0
runs/Jun05_05-50-08_r-woao-chinese-class-s80cial6-94945-6uslq/events.out.tfevents.1717566610.r-woao-chinese-class-s80cial6-94945-6uslq.114.0 +2 -2
runs/Jun05_05-50-08_r-woao-chinese-class-s80cial6-94945-6uslq/events.out.tfevents.1717579625.r-woao-chinese-class-s80cial6-94945-6uslq.114.1 +3 -0
special_tokens_map.json +7 -0
tokenizer.json +0 -0
tokenizer_config.json +57 -0
training_args.bin +3 -0
training_params.json +30 -0
vocab.txt +0 -0

README.md ADDED Viewed

	@@ -0,0 +1,36 @@

+---
+tags:
+- autotrain
+- text-classification
+base_model: uer/roberta-base-finetuned-chinanews-chinese
+widget:
+- text: "I love AutoTrain"
+---
+# Model Trained Using AutoTrain
+- Problem type: Text Classification
+## Validation Metrics
+loss: 0.08590201288461685
+f1_macro: 0.9552925131881786
+f1_micro: 0.9736164736164736
+f1_weighted: 0.9730779143688454
+precision_macro: 0.9600774753043094
+precision_micro: 0.9736164736164736
+precision_weighted: 0.9743888843393359
+recall_macro: 0.9541124951907006
+recall_micro: 0.9736164736164736
+recall_weighted: 0.9736164736164736
+accuracy: 0.9736164736164736

checkpoint-2331/config.json ADDED Viewed

	@@ -0,0 +1,44 @@

+{
+  "_name_or_path": "uer/roberta-base-finetuned-chinanews-chinese",
+  "_num_labels": 6,
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "\u4e3b\u9898\u6d3b\u52a8",
+    "1": "\u5e38\u9a7b\u6d3b\u52a8",
+    "2": "\u65b0\u4eba\u6d3b\u52a8",
+    "3": "\u7279\u6743\u00b7\u57fa\u91d1\u00b7\u6218\u4ee4\u00b7\u5468\u5361",
+    "4": "\u8d27\u5e01\u5145\u503c",
+    "5": "\u9650\u65f6\u6d3b\u52a8"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "\u4e3b\u9898\u6d3b\u52a8": 0,
+    "\u5e38\u9a7b\u6d3b\u52a8": 1,
+    "\u65b0\u4eba\u6d3b\u52a8": 2,
+    "\u7279\u6743\u00b7\u57fa\u91d1\u00b7\u6218\u4ee4\u00b7\u5468\u5361": 3,
+    "\u8d27\u5e01\u5145\u503c": 4,
+    "\u9650\u65f6\u6d3b\u52a8": 5
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "pad_token_id": 0,
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.41.0",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 21128
+}

checkpoint-2331/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:34239ed338c349e0b355afe4a5d5940f1e2699bb75f2070d9dad7bf533b2df9c
+size 409112544

checkpoint-2331/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:106a2105bfdd5bbbd0916b0cbc19034775cc46fd1a967a481dbc103192537670
+size 818340602

checkpoint-2331/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1fc7f61f749668a9aaf672694a631dc41e054c97cc1203b13d5e0b7c303dba86
+size 13990

checkpoint-2331/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4e512932b9106cd1d1c30e2601797adbf6f8a52f8cb520bf71239496718e7bee
+size 1064

checkpoint-2331/trainer_state.json ADDED Viewed

	@@ -0,0 +1,747 @@

+{
+  "best_metric": 0.08590201288461685,
+  "best_model_checkpoint": "autotrain-EVENT/checkpoint-2331",
+  "epoch": 3.0,
+  "eval_steps": 500,
+  "global_step": 2331,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.032175032175032175,
+      "grad_norm": 11.68185806274414,
+      "learning_rate": 5.341880341880342e-06,
+      "loss": 1.7842,
+      "step": 25
+    },
+    {
+      "epoch": 0.06435006435006435,
+      "grad_norm": 6.230990886688232,
+      "learning_rate": 1.0683760683760684e-05,
+      "loss": 1.1267,
+      "step": 50
+    },
+    {
+      "epoch": 0.09652509652509653,
+      "grad_norm": 4.519747257232666,
+      "learning_rate": 1.602564102564103e-05,
+      "loss": 0.7128,
+      "step": 75
+    },
+    {
+      "epoch": 0.1287001287001287,
+      "grad_norm": 1.394315481185913,
+      "learning_rate": 2.1367521367521368e-05,
+      "loss": 0.5326,
+      "step": 100
+    },
+    {
+      "epoch": 0.16087516087516088,
+      "grad_norm": 28.153669357299805,
+      "learning_rate": 2.670940170940171e-05,
+      "loss": 0.4819,
+      "step": 125
+    },
+    {
+      "epoch": 0.19305019305019305,
+      "grad_norm": 1.6043665409088135,
+      "learning_rate": 3.205128205128206e-05,
+      "loss": 0.354,
+      "step": 150
+    },
+    {
+      "epoch": 0.22522522522522523,
+      "grad_norm": 6.796542167663574,
+      "learning_rate": 3.739316239316239e-05,
+      "loss": 0.3478,
+      "step": 175
+    },
+    {
+      "epoch": 0.2574002574002574,
+      "grad_norm": 1.6112338304519653,
+      "learning_rate": 4.2735042735042735e-05,
+      "loss": 0.2892,
+      "step": 200
+    },
+    {
+      "epoch": 0.28957528957528955,
+      "grad_norm": 0.8286625742912292,
+      "learning_rate": 4.8076923076923084e-05,
+      "loss": 0.2734,
+      "step": 225
+    },
+    {
+      "epoch": 0.32175032175032175,
+      "grad_norm": 35.574424743652344,
+      "learning_rate": 4.961850262279447e-05,
+      "loss": 0.3152,
+      "step": 250
+    },
+    {
+      "epoch": 0.3539253539253539,
+      "grad_norm": 3.241590738296509,
+      "learning_rate": 4.9022412970910824e-05,
+      "loss": 0.166,
+      "step": 275
+    },
+    {
+      "epoch": 0.3861003861003861,
+      "grad_norm": 1.9818757772445679,
+      "learning_rate": 4.8426323319027184e-05,
+      "loss": 0.1839,
+      "step": 300
+    },
+    {
+      "epoch": 0.41827541827541825,
+      "grad_norm": 0.07353338599205017,
+      "learning_rate": 4.7830233667143544e-05,
+      "loss": 0.168,
+      "step": 325
+    },
+    {
+      "epoch": 0.45045045045045046,
+      "grad_norm": 17.200748443603516,
+      "learning_rate": 4.72341440152599e-05,
+      "loss": 0.2131,
+      "step": 350
+    },
+    {
+      "epoch": 0.4826254826254826,
+      "grad_norm": 0.17287948727607727,
+      "learning_rate": 4.663805436337626e-05,
+      "loss": 0.1893,
+      "step": 375
+    },
+    {
+      "epoch": 0.5148005148005148,
+      "grad_norm": 2.6518495082855225,
+      "learning_rate": 4.604196471149261e-05,
+      "loss": 0.1,
+      "step": 400
+    },
+    {
+      "epoch": 0.546975546975547,
+      "grad_norm": 0.2751850485801697,
+      "learning_rate": 4.5445875059608964e-05,
+      "loss": 0.2003,
+      "step": 425
+    },
+    {
+      "epoch": 0.5791505791505791,
+      "grad_norm": 0.1038702130317688,
+      "learning_rate": 4.4849785407725324e-05,
+      "loss": 0.1516,
+      "step": 450
+    },
+    {
+      "epoch": 0.6113256113256114,
+      "grad_norm": 3.7733001708984375,
+      "learning_rate": 4.425369575584168e-05,
+      "loss": 0.1621,
+      "step": 475
+    },
+    {
+      "epoch": 0.6435006435006435,
+      "grad_norm": 11.369443893432617,
+      "learning_rate": 4.365760610395804e-05,
+      "loss": 0.209,
+      "step": 500
+    },
+    {
+      "epoch": 0.6756756756756757,
+      "grad_norm": 1.2104507684707642,
+      "learning_rate": 4.30615164520744e-05,
+      "loss": 0.0893,
+      "step": 525
+    },
+    {
+      "epoch": 0.7078507078507078,
+      "grad_norm": 6.639780044555664,
+      "learning_rate": 4.246542680019075e-05,
+      "loss": 0.1771,
+      "step": 550
+    },
+    {
+      "epoch": 0.7400257400257401,
+      "grad_norm": 0.2439693808555603,
+      "learning_rate": 4.186933714830711e-05,
+      "loss": 0.149,
+      "step": 575
+    },
+    {
+      "epoch": 0.7722007722007722,
+      "grad_norm": 0.13589037954807281,
+      "learning_rate": 4.1273247496423464e-05,
+      "loss": 0.2146,
+      "step": 600
+    },
+    {
+      "epoch": 0.8043758043758044,
+      "grad_norm": 0.09856387972831726,
+      "learning_rate": 4.067715784453982e-05,
+      "loss": 0.2026,
+      "step": 625
+    },
+    {
+      "epoch": 0.8365508365508365,
+      "grad_norm": 8.529484748840332,
+      "learning_rate": 4.008106819265618e-05,
+      "loss": 0.1483,
+      "step": 650
+    },
+    {
+      "epoch": 0.8687258687258688,
+      "grad_norm": 0.18708932399749756,
+      "learning_rate": 3.948497854077253e-05,
+      "loss": 0.1885,
+      "step": 675
+    },
+    {
+      "epoch": 0.9009009009009009,
+      "grad_norm": 0.09533143043518066,
+      "learning_rate": 3.888888888888889e-05,
+      "loss": 0.0893,
+      "step": 700
+    },
+    {
+      "epoch": 0.9330759330759331,
+      "grad_norm": 1.1151599884033203,
+      "learning_rate": 3.829279923700525e-05,
+      "loss": 0.1439,
+      "step": 725
+    },
+    {
+      "epoch": 0.9652509652509652,
+      "grad_norm": 0.049121320247650146,
+      "learning_rate": 3.7696709585121604e-05,
+      "loss": 0.1269,
+      "step": 750
+    },
+    {
+      "epoch": 0.9974259974259975,
+      "grad_norm": 4.54576301574707,
+      "learning_rate": 3.7100619933237964e-05,
+      "loss": 0.058,
+      "step": 775
+    },
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.9658944658944659,
+      "eval_f1_macro": 0.772591124028629,
+      "eval_f1_micro": 0.9658944658944659,
+      "eval_f1_weighted": 0.9654973088654933,
+      "eval_loss": 0.15877199172973633,
+      "eval_precision_macro": 0.7681480676677164,
+      "eval_precision_micro": 0.9658944658944659,
+      "eval_precision_weighted": 0.9664943022041425,
+      "eval_recall_macro": 0.7828568464611712,
+      "eval_recall_micro": 0.9658944658944659,
+      "eval_recall_weighted": 0.9658944658944659,
+      "eval_runtime": 250.4762,
+      "eval_samples_per_second": 6.204,
+      "eval_steps_per_second": 0.391,
+      "step": 777
+    },
+    {
+      "epoch": 1.0296010296010296,
+      "grad_norm": 0.06902267038822174,
+      "learning_rate": 3.650453028135432e-05,
+      "loss": 0.0681,
+      "step": 800
+    },
+    {
+      "epoch": 1.0617760617760619,
+      "grad_norm": 0.03424418717622757,
+      "learning_rate": 3.590844062947068e-05,
+      "loss": 0.1559,
+      "step": 825
+    },
+    {
+      "epoch": 1.093951093951094,
+      "grad_norm": 0.06254427880048752,
+      "learning_rate": 3.531235097758703e-05,
+      "loss": 0.0564,
+      "step": 850
+    },
+    {
+      "epoch": 1.1261261261261262,
+      "grad_norm": 0.13381192088127136,
+      "learning_rate": 3.4716261325703384e-05,
+      "loss": 0.1388,
+      "step": 875
+    },
+    {
+      "epoch": 1.1583011583011582,
+      "grad_norm": 14.801521301269531,
+      "learning_rate": 3.4120171673819744e-05,
+      "loss": 0.1437,
+      "step": 900
+    },
+    {
+      "epoch": 1.1904761904761905,
+      "grad_norm": 8.712313652038574,
+      "learning_rate": 3.35240820219361e-05,
+      "loss": 0.1262,
+      "step": 925
+    },
+    {
+      "epoch": 1.2226512226512227,
+      "grad_norm": 0.02129649743437767,
+      "learning_rate": 3.292799237005246e-05,
+      "loss": 0.101,
+      "step": 950
+    },
+    {
+      "epoch": 1.2548262548262548,
+      "grad_norm": 0.08888272196054459,
+      "learning_rate": 3.233190271816882e-05,
+      "loss": 0.2086,
+      "step": 975
+    },
+    {
+      "epoch": 1.287001287001287,
+      "grad_norm": 6.242756366729736,
+      "learning_rate": 3.173581306628517e-05,
+      "loss": 0.1234,
+      "step": 1000
+    },
+    {
+      "epoch": 1.3191763191763193,
+      "grad_norm": 0.01962357573211193,
+      "learning_rate": 3.113972341440153e-05,
+      "loss": 0.0653,
+      "step": 1025
+    },
+    {
+      "epoch": 1.3513513513513513,
+      "grad_norm": 18.92928695678711,
+      "learning_rate": 3.0543633762517884e-05,
+      "loss": 0.146,
+      "step": 1050
+    },
+    {
+      "epoch": 1.3835263835263836,
+      "grad_norm": 2.8306164741516113,
+      "learning_rate": 2.994754411063424e-05,
+      "loss": 0.1142,
+      "step": 1075
+    },
+    {
+      "epoch": 1.4157014157014158,
+      "grad_norm": 0.09596404433250427,
+      "learning_rate": 2.93514544587506e-05,
+      "loss": 0.1631,
+      "step": 1100
+    },
+    {
+      "epoch": 1.4478764478764479,
+      "grad_norm": 0.200534388422966,
+      "learning_rate": 2.8755364806866954e-05,
+      "loss": 0.0705,
+      "step": 1125
+    },
+    {
+      "epoch": 1.4800514800514801,
+      "grad_norm": 6.499765396118164,
+      "learning_rate": 2.815927515498331e-05,
+      "loss": 0.0771,
+      "step": 1150
+    },
+    {
+      "epoch": 1.5122265122265124,
+      "grad_norm": 0.01246571820229292,
+      "learning_rate": 2.756318550309967e-05,
+      "loss": 0.0237,
+      "step": 1175
+    },
+    {
+      "epoch": 1.5444015444015444,
+      "grad_norm": 106.53581237792969,
+      "learning_rate": 2.6967095851216024e-05,
+      "loss": 0.0858,
+      "step": 1200
+    },
+    {
+      "epoch": 1.5765765765765765,
+      "grad_norm": 0.30157119035720825,
+      "learning_rate": 2.637100619933238e-05,
+      "loss": 0.1932,
+      "step": 1225
+    },
+    {
+      "epoch": 1.6087516087516087,
+      "grad_norm": 0.030282437801361084,
+      "learning_rate": 2.5774916547448734e-05,
+      "loss": 0.0628,
+      "step": 1250
+    },
+    {
+      "epoch": 1.640926640926641,
+      "grad_norm": 0.01327039860188961,
+      "learning_rate": 2.5178826895565094e-05,
+      "loss": 0.0115,
+      "step": 1275
+    },
+    {
+      "epoch": 1.673101673101673,
+      "grad_norm": 0.3962545394897461,
+      "learning_rate": 2.458273724368145e-05,
+      "loss": 0.1223,
+      "step": 1300
+    },
+    {
+      "epoch": 1.7052767052767053,
+      "grad_norm": 0.060676004737615585,
+      "learning_rate": 2.3986647591797807e-05,
+      "loss": 0.1351,
+      "step": 1325
+    },
+    {
+      "epoch": 1.7374517374517375,
+      "grad_norm": 10.573041915893555,
+      "learning_rate": 2.3390557939914164e-05,
+      "loss": 0.0516,
+      "step": 1350
+    },
+    {
+      "epoch": 1.7696267696267696,
+      "grad_norm": 0.7964749932289124,
+      "learning_rate": 2.279446828803052e-05,
+      "loss": 0.0549,
+      "step": 1375
+    },
+    {
+      "epoch": 1.8018018018018018,
+      "grad_norm": 7.966588020324707,
+      "learning_rate": 2.2198378636146877e-05,
+      "loss": 0.155,
+      "step": 1400
+    },
+    {
+      "epoch": 1.833976833976834,
+      "grad_norm": 0.019958429038524628,
+      "learning_rate": 2.1602288984263234e-05,
+      "loss": 0.0414,
+      "step": 1425
+    },
+    {
+      "epoch": 1.8661518661518661,
+      "grad_norm": 4.273733615875244,
+      "learning_rate": 2.100619933237959e-05,
+      "loss": 0.1769,
+      "step": 1450
+    },
+    {
+      "epoch": 1.8983268983268984,
+      "grad_norm": 0.011619496159255505,
+      "learning_rate": 2.0410109680495947e-05,
+      "loss": 0.0598,
+      "step": 1475
+    },
+    {
+      "epoch": 1.9305019305019306,
+      "grad_norm": 3.8245315551757812,
+      "learning_rate": 1.9814020028612304e-05,
+      "loss": 0.1632,
+      "step": 1500
+    },
+    {
+      "epoch": 1.9626769626769627,
+      "grad_norm": 0.02121666446328163,
+      "learning_rate": 1.921793037672866e-05,
+      "loss": 0.0474,
+      "step": 1525
+    },
+    {
+      "epoch": 1.9948519948519947,
+      "grad_norm": 0.023423343896865845,
+      "learning_rate": 1.862184072484502e-05,
+      "loss": 0.0394,
+      "step": 1550
+    },
+    {
+      "epoch": 2.0,
+      "eval_accuracy": 0.9736164736164736,
+      "eval_f1_macro": 0.9559989029773911,
+      "eval_f1_micro": 0.9736164736164736,
+      "eval_f1_weighted": 0.9729748817677593,
+      "eval_loss": 0.10379565507173538,
+      "eval_precision_macro": 0.9641828592385946,
+      "eval_precision_micro": 0.9736164736164736,
+      "eval_precision_weighted": 0.9739386934178119,
+      "eval_recall_macro": 0.9503030193594619,
+      "eval_recall_micro": 0.9736164736164736,
+      "eval_recall_weighted": 0.9736164736164736,
+      "eval_runtime": 243.5935,
+      "eval_samples_per_second": 6.379,
+      "eval_steps_per_second": 0.402,
+      "step": 1554
+    },
+    {
+      "epoch": 2.027027027027027,
+      "grad_norm": 0.014448375441133976,
+      "learning_rate": 1.8025751072961374e-05,
+      "loss": 0.0738,
+      "step": 1575
+    },
+    {
+      "epoch": 2.0592020592020592,
+      "grad_norm": 1.0607327222824097,
+      "learning_rate": 1.742966142107773e-05,
+      "loss": 0.0453,
+      "step": 1600
+    },
+    {
+      "epoch": 2.0913770913770913,
+      "grad_norm": 0.034898240119218826,
+      "learning_rate": 1.6833571769194087e-05,
+      "loss": 0.1593,
+      "step": 1625
+    },
+    {
+      "epoch": 2.1235521235521237,
+      "grad_norm": 3.719592332839966,
+      "learning_rate": 1.6237482117310444e-05,
+      "loss": 0.105,
+      "step": 1650
+    },
+    {
+      "epoch": 2.155727155727156,
+      "grad_norm": 0.02683943510055542,
+      "learning_rate": 1.56413924654268e-05,
+      "loss": 0.0575,
+      "step": 1675
+    },
+    {
+      "epoch": 2.187902187902188,
+      "grad_norm": 0.014749615453183651,
+      "learning_rate": 1.5045302813543157e-05,
+      "loss": 0.0777,
+      "step": 1700
+    },
+    {
+      "epoch": 2.2200772200772203,
+      "grad_norm": 0.016101358458399773,
+      "learning_rate": 1.4449213161659514e-05,
+      "loss": 0.0226,
+      "step": 1725
+    },
+    {
+      "epoch": 2.2522522522522523,
+      "grad_norm": 0.18409115076065063,
+      "learning_rate": 1.385312350977587e-05,
+      "loss": 0.1178,
+      "step": 1750
+    },
+    {
+      "epoch": 2.2844272844272844,
+      "grad_norm": 0.012963847257196903,
+      "learning_rate": 1.3257033857892229e-05,
+      "loss": 0.0424,
+      "step": 1775
+    },
+    {
+      "epoch": 2.3166023166023164,
+      "grad_norm": 0.020922504365444183,
+      "learning_rate": 1.2660944206008585e-05,
+      "loss": 0.0916,
+      "step": 1800
+    },
+    {
+      "epoch": 2.348777348777349,
+      "grad_norm": 0.020266762003302574,
+      "learning_rate": 1.206485455412494e-05,
+      "loss": 0.0398,
+      "step": 1825
+    },
+    {
+      "epoch": 2.380952380952381,
+      "grad_norm": 0.011511508375406265,
+      "learning_rate": 1.1468764902241299e-05,
+      "loss": 0.047,
+      "step": 1850
+    },
+    {
+      "epoch": 2.413127413127413,
+      "grad_norm": 0.011209013871848583,
+      "learning_rate": 1.0872675250357654e-05,
+      "loss": 0.0416,
+      "step": 1875
+    },
+    {
+      "epoch": 2.4453024453024454,
+      "grad_norm": 0.019312728196382523,
+      "learning_rate": 1.027658559847401e-05,
+      "loss": 0.0408,
+      "step": 1900
+    },
+    {
+      "epoch": 2.4774774774774775,
+      "grad_norm": 0.015620889142155647,
+      "learning_rate": 9.680495946590367e-06,
+      "loss": 0.0712,
+      "step": 1925
+    },
+    {
+      "epoch": 2.5096525096525095,
+      "grad_norm": 0.010242036543786526,
+      "learning_rate": 9.084406294706724e-06,
+      "loss": 0.0537,
+      "step": 1950
+    },
+    {
+      "epoch": 2.5418275418275416,
+      "grad_norm": 0.03769510239362717,
+      "learning_rate": 8.488316642823082e-06,
+      "loss": 0.0723,
+      "step": 1975
+    },
+    {
+      "epoch": 2.574002574002574,
+      "grad_norm": 0.011480485089123249,
+      "learning_rate": 7.892226990939437e-06,
+      "loss": 0.0222,
+      "step": 2000
+    },
+    {
+      "epoch": 2.606177606177606,
+      "grad_norm": 5.9189887046813965,
+      "learning_rate": 7.296137339055794e-06,
+      "loss": 0.0555,
+      "step": 2025
+    },
+    {
+      "epoch": 2.6383526383526386,
+      "grad_norm": 0.09751153737306595,
+      "learning_rate": 6.700047687172151e-06,
+      "loss": 0.007,
+      "step": 2050
+    },
+    {
+      "epoch": 2.6705276705276706,
+      "grad_norm": 0.026520784944295883,
+      "learning_rate": 6.103958035288508e-06,
+      "loss": 0.03,
+      "step": 2075
+    },
+    {
+      "epoch": 2.7027027027027026,
+      "grad_norm": 0.007995215244591236,
+      "learning_rate": 5.507868383404864e-06,
+      "loss": 0.0968,
+      "step": 2100
+    },
+    {
+      "epoch": 2.7348777348777347,
+      "grad_norm": 0.015287132933735847,
+      "learning_rate": 4.911778731521221e-06,
+      "loss": 0.0496,
+      "step": 2125
+    },
+    {
+      "epoch": 2.767052767052767,
+      "grad_norm": 0.014539040625095367,
+      "learning_rate": 4.315689079637578e-06,
+      "loss": 0.0073,
+      "step": 2150
+    },
+    {
+      "epoch": 2.799227799227799,
+      "grad_norm": 0.011436503380537033,
+      "learning_rate": 3.7195994277539344e-06,
+      "loss": 0.0382,
+      "step": 2175
+    },
+    {
+      "epoch": 2.8314028314028317,
+      "grad_norm": 0.012776638381183147,
+      "learning_rate": 3.123509775870291e-06,
+      "loss": 0.0606,
+      "step": 2200
+    },
+    {
+      "epoch": 2.8635778635778637,
+      "grad_norm": 0.011094256304204464,
+      "learning_rate": 2.5274201239866477e-06,
+      "loss": 0.0281,
+      "step": 2225
+    },
+    {
+      "epoch": 2.8957528957528957,
+      "grad_norm": 3.787529706954956,
+      "learning_rate": 1.9313304721030048e-06,
+      "loss": 0.0462,
+      "step": 2250
+    },
+    {
+      "epoch": 2.9279279279279278,
+      "grad_norm": 0.49334508180618286,
+      "learning_rate": 1.3352408202193612e-06,
+      "loss": 0.0321,
+      "step": 2275
+    },
+    {
+      "epoch": 2.9601029601029603,
+      "grad_norm": 0.015266060829162598,
+      "learning_rate": 7.391511683357177e-07,
+      "loss": 0.0072,
+      "step": 2300
+    },
+    {
+      "epoch": 2.9922779922779923,
+      "grad_norm": 0.008497793227434158,
+      "learning_rate": 1.430615164520744e-07,
+      "loss": 0.0373,
+      "step": 2325
+    },
+    {
+      "epoch": 3.0,
+      "eval_accuracy": 0.9736164736164736,
+      "eval_f1_macro": 0.9552925131881786,
+      "eval_f1_micro": 0.9736164736164736,
+      "eval_f1_weighted": 0.9730779143688454,
+      "eval_loss": 0.08590201288461685,
+      "eval_precision_macro": 0.9600774753043094,
+      "eval_precision_micro": 0.9736164736164736,
+      "eval_precision_weighted": 0.9743888843393359,
+      "eval_recall_macro": 0.9541124951907006,
+      "eval_recall_micro": 0.9736164736164736,
+      "eval_recall_weighted": 0.9736164736164736,
+      "eval_runtime": 274.6108,
+      "eval_samples_per_second": 5.659,
+      "eval_steps_per_second": 0.357,
+      "step": 2331
+    }
+  ],
+  "logging_steps": 25,
+  "max_steps": 2331,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 3,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "EarlyStoppingCallback": {
+      "args": {
+        "early_stopping_patience": 5,
+        "early_stopping_threshold": 0.01
+      },
+      "attributes": {
+        "early_stopping_patience_counter": 0
+      }
+    },
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": true
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 1226273112769536.0,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-2331/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9e74f5608d1ef20f887d78e8dcd203cb8bbc5c80f52e6eb90871344b27f884b8
+size 5112

config.json ADDED Viewed

	@@ -0,0 +1,44 @@

+{
+  "_name_or_path": "uer/roberta-base-finetuned-chinanews-chinese",
+  "_num_labels": 6,
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "\u4e3b\u9898\u6d3b\u52a8",
+    "1": "\u5e38\u9a7b\u6d3b\u52a8",
+    "2": "\u65b0\u4eba\u6d3b\u52a8",
+    "3": "\u7279\u6743\u00b7\u57fa\u91d1\u00b7\u6218\u4ee4\u00b7\u5468\u5361",
+    "4": "\u8d27\u5e01\u5145\u503c",
+    "5": "\u9650\u65f6\u6d3b\u52a8"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "\u4e3b\u9898\u6d3b\u52a8": 0,
+    "\u5e38\u9a7b\u6d3b\u52a8": 1,
+    "\u65b0\u4eba\u6d3b\u52a8": 2,
+    "\u7279\u6743\u00b7\u57fa\u91d1\u00b7\u6218\u4ee4\u00b7\u5468\u5361": 3,
+    "\u8d27\u5e01\u5145\u503c": 4,
+    "\u9650\u65f6\u6d3b\u52a8": 5
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "pad_token_id": 0,
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.41.0",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 21128
+}

model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:34239ed338c349e0b355afe4a5d5940f1e2699bb75f2070d9dad7bf533b2df9c
+size 409112544

runs/Jun05_05-50-08_r-woao-chinese-class-s80cial6-94945-6uslq/events.out.tfevents.1717566610.r-woao-chinese-class-s80cial6-94945-6uslq.114.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:061dcff7bfacc6474633b051dc80de61d56b076f6dcd588572c61fe15b920d01
-size 25655

 version https://git-lfs.github.com/spec/v1
+oid sha256:ed0842a0c75ede460948edc551208663422bd7e52152f1842f0d5599f8bf9c8d
+size 27897

runs/Jun05_05-50-08_r-woao-chinese-class-s80cial6-94945-6uslq/events.out.tfevents.1717579625.r-woao-chinese-class-s80cial6-94945-6uslq.114.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fd713155ae63ce0e64560d2986de471e12c958553b8432bcdeaa7ff07b4bfea2
+size 921

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,57 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_basic_tokenize": true,
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 1000000000000000019884624838656,
+  "never_split": null,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "BertTokenizer",
+  "unk_token": "[UNK]"
+}

training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9e74f5608d1ef20f887d78e8dcd203cb8bbc5c80f52e6eb90871344b27f884b8
+size 5112

training_params.json ADDED Viewed

	@@ -0,0 +1,30 @@

+{
+    "data_path": "autotrain-EVENT/autotrain-data",
+    "model": "uer/roberta-base-finetuned-chinanews-chinese",
+    "lr": 5e-05,
+    "epochs": 3,
+    "max_seq_length": 128,
+    "batch_size": 8,
+    "warmup_ratio": 0.1,
+    "gradient_accumulation": 1,
+    "optimizer": "adamw_torch",
+    "scheduler": "linear",
+    "weight_decay": 0.0,
+    "max_grad_norm": 1.0,
+    "seed": 42,
+    "train_split": "train",
+    "valid_split": "validation",
+    "text_column": "autotrain_text",
+    "target_column": "autotrain_label",
+    "logging_steps": -1,
+    "project_name": "autotrain-EVENT",
+    "auto_find_batch_size": false,
+    "mixed_precision": "fp16",
+    "save_total_limit": 1,
+    "push_to_hub": true,
+    "evaluation_strategy": "epoch",
+    "username": "Woao",
+    "log": "tensorboard",
+    "early_stopping_patience": 5,
+    "early_stopping_threshold": 0.01
+}

vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff