From 8cb7f201ad73a4d881ce67c04584964863f0666f Mon Sep 17 00:00:00 2001 From: Niels Horn Date: Tue, 27 Feb 2024 21:17:41 +0000 Subject: [PATCH] End of training --- .gitattributes | 1 + README.md | 21 +++++++++++++++++++-- all_results.json | 10 ++++++++++ eval_results.json | 10 ++++++++++ trainer_state.json | 3 +++ 5 files changed, 43 insertions(+), 2 deletions(-) create mode 100644 all_results.json create mode 100644 eval_results.json create mode 100644 trainer_state.json diff --git a/.gitattributes b/.gitattributes index a6344aa..9546427 100644 --- a/.gitattributes +++ b/.gitattributes @@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.zip filter=lfs diff=lfs merge=lfs -text *.zst filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text +trainer_state.json filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md index 74d8dfc..1e6d3e9 100644 --- a/README.md +++ b/README.md @@ -1,9 +1,23 @@ --- tags: - generated_from_trainer +datasets: +- roneneldan/TinyStories +metrics: +- accuracy model-index: - name: mistral-1L-tiny - results: [] + results: + - task: + name: Causal Language Modeling + type: text-generation + dataset: + name: roneneldan/TinyStories + type: roneneldan/TinyStories + metrics: + - name: Accuracy + type: accuracy + value: 0.5792084706530948 --- # mistral-1L-tiny -This model is a fine-tuned version of [](https://huggingface.co/) on an unknown dataset. +This model is a fine-tuned version of [](https://huggingface.co/) on the roneneldan/TinyStories dataset. +It achieves the following results on the evaluation set: +- Loss: 1.6868 +- Accuracy: 0.5792 ## Model description diff --git a/all_results.json b/all_results.json new file mode 100644 index 0000000..3fc5a86 --- /dev/null +++ b/all_results.json @@ -0,0 +1,10 @@ +{ + "epoch": 3.0, + "eval_accuracy": 0.5792084706530948, + "eval_loss": 1.6868340969085693, + "eval_runtime": 23.785, + "eval_samples": 19348, + "eval_samples_per_second": 813.455, + "eval_steps_per_second": 101.703, + "perplexity": 5.4023502853454595 +} \ No newline at end of file diff --git a/eval_results.json b/eval_results.json new file mode 100644 index 0000000..3fc5a86 --- /dev/null +++ b/eval_results.json @@ -0,0 +1,10 @@ +{ + "epoch": 3.0, + "eval_accuracy": 0.5792084706530948, + "eval_loss": 1.6868340969085693, + "eval_runtime": 23.785, + "eval_samples": 19348, + "eval_samples_per_second": 813.455, + "eval_steps_per_second": 101.703, + "perplexity": 5.4023502853454595 +} \ No newline at end of file diff --git a/trainer_state.json b/trainer_state.json new file mode 100644 index 0000000..9a0aa2f --- /dev/null +++ b/trainer_state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dce367bda1a7a853460ad56dafa3617b9cc9f33ef5b6deed0d5c7394de019e0d +size 14518582