cranky-coder08 committed
Commit b48a35b · verified · 1 Parent(s): fa85331

Add files using upload-large-folder tool

Files changed (50)
  1. .gitattributes +5 -35
  2. Dockerfile +24 -0
  3. data/log_dataset.jsonl +0 -0
  4. data_analyser.py +0 -0
  5. docker-compose.yml +19 -0
  6. merged_tinyllama_logger/config.json +29 -0
  7. merged_tinyllama_logger/generation_config.json +7 -0
  8. merged_tinyllama_logger/special_tokens_map.json +30 -0
  9. merged_tinyllama_logger/tokenizer.json +0 -0
  10. merged_tinyllama_logger/tokenizer_config.json +43 -0
  11. merging_model.py +52 -0
  12. model_output/incremental_1_logs/README.md +202 -0
  13. model_output/incremental_1_logs/adapter_config.json +29 -0
  14. model_output/incremental_1_logs/checkpoint-575/README.md +202 -0
  15. model_output/incremental_1_logs/checkpoint-575/adapter_config.json +29 -0
  16. model_output/incremental_1_logs/checkpoint-575/special_tokens_map.json +24 -0
  17. model_output/incremental_1_logs/checkpoint-575/tokenizer.json +0 -0
  18. model_output/incremental_1_logs/checkpoint-575/tokenizer_config.json +43 -0
  19. model_output/incremental_1_logs/checkpoint-575/trainer_state.json +625 -0
  20. model_output/incremental_1_logs/special_tokens_map.json +24 -0
  21. model_output/incremental_1_logs/tokenizer.json +0 -0
  22. model_output/incremental_1_logs/tokenizer_config.json +43 -0
  23. model_output/phi2_finetuned_logs/README.md +202 -0
  24. model_output/phi2_finetuned_logs/adapter_config.json +29 -0
  25. model_output/phi2_finetuned_logs/special_tokens_map.json +24 -0
  26. model_output/phi2_finetuned_logs/tokenizer.json +0 -0
  27. model_output/phi2_finetuned_logs/tokenizer_config.json +43 -0
  28. phivenv/Lib/site-packages/certifi-2025.8.3.dist-info/INSTALLER +1 -0
  29. phivenv/Lib/site-packages/certifi-2025.8.3.dist-info/METADATA +77 -0
  30. phivenv/Lib/site-packages/certifi-2025.8.3.dist-info/RECORD +14 -0
  31. phivenv/Lib/site-packages/certifi-2025.8.3.dist-info/WHEEL +5 -0
  32. phivenv/Lib/site-packages/certifi-2025.8.3.dist-info/licenses/LICENSE +20 -0
  33. phivenv/Lib/site-packages/certifi-2025.8.3.dist-info/top_level.txt +1 -0
  34. phivenv/Lib/site-packages/certifi/__init__.py +4 -0
  35. phivenv/Lib/site-packages/certifi/__main__.py +12 -0
  36. phivenv/Lib/site-packages/certifi/__pycache__/__init__.cpython-39.pyc +0 -0
  37. phivenv/Lib/site-packages/certifi/__pycache__/__main__.cpython-39.pyc +0 -0
  38. phivenv/Lib/site-packages/certifi/__pycache__/core.cpython-39.pyc +0 -0
  39. phivenv/Lib/site-packages/certifi/cacert.pem +0 -0
  40. phivenv/Lib/site-packages/certifi/core.py +83 -0
  41. phivenv/Lib/site-packages/certifi/py.typed +0 -0
  42. phivenv/Lib/site-packages/charset_normalizer/api.py +669 -0
  43. phivenv/Lib/site-packages/isympy.py +342 -0
  44. phivenv/Lib/site-packages/numpy-2.0.2-cp39-cp39-win_amd64.whl +0 -0
  45. phivenv/Lib/site-packages/typing_extensions.py +0 -0
  46. phivenv/pyvenv.cfg +3 -0
  47. requirements.txt +0 -0
  48. testing_merged_model.py +74 -0
  49. training_phi2.py +107 -0
  50. upload_to_hub.py +26 -0
.gitattributes CHANGED
@@ -1,35 +1,5 @@
- *.7z filter=lfs diff=lfs merge=lfs -text
- *.arrow filter=lfs diff=lfs merge=lfs -text
- *.bin filter=lfs diff=lfs merge=lfs -text
- *.bz2 filter=lfs diff=lfs merge=lfs -text
- *.ckpt filter=lfs diff=lfs merge=lfs -text
- *.ftz filter=lfs diff=lfs merge=lfs -text
- *.gz filter=lfs diff=lfs merge=lfs -text
- *.h5 filter=lfs diff=lfs merge=lfs -text
- *.joblib filter=lfs diff=lfs merge=lfs -text
- *.lfs.* filter=lfs diff=lfs merge=lfs -text
- *.mlmodel filter=lfs diff=lfs merge=lfs -text
- *.model filter=lfs diff=lfs merge=lfs -text
- *.msgpack filter=lfs diff=lfs merge=lfs -text
- *.npy filter=lfs diff=lfs merge=lfs -text
- *.npz filter=lfs diff=lfs merge=lfs -text
- *.onnx filter=lfs diff=lfs merge=lfs -text
- *.ot filter=lfs diff=lfs merge=lfs -text
- *.parquet filter=lfs diff=lfs merge=lfs -text
- *.pb filter=lfs diff=lfs merge=lfs -text
- *.pickle filter=lfs diff=lfs merge=lfs -text
- *.pkl filter=lfs diff=lfs merge=lfs -text
- *.pt filter=lfs diff=lfs merge=lfs -text
- *.pth filter=lfs diff=lfs merge=lfs -text
- *.rar filter=lfs diff=lfs merge=lfs -text
- *.safetensors filter=lfs diff=lfs merge=lfs -text
- saved_model/**/* filter=lfs diff=lfs merge=lfs -text
- *.tar.* filter=lfs diff=lfs merge=lfs -text
- *.tar filter=lfs diff=lfs merge=lfs -text
- *.tflite filter=lfs diff=lfs merge=lfs -text
- *.tgz filter=lfs diff=lfs merge=lfs -text
- *.wasm filter=lfs diff=lfs merge=lfs -text
- *.xz filter=lfs diff=lfs merge=lfs -text
- *.zip filter=lfs diff=lfs merge=lfs -text
- *.zst filter=lfs diff=lfs merge=lfs -text
- *tfevents* filter=lfs diff=lfs merge=lfs -text
+ *.bin filter=lfs diff=lfs merge=lfs -text
+ *.safetensors filter=lfs diff=lfs merge=lfs -text
+ *.h5 filter=lfs diff=lfs merge=lfs -text
+ *.pth filter=lfs diff=lfs merge=lfs -text
+ *.tar filter=lfs diff=lfs merge=lfs -text
Dockerfile ADDED
@@ -0,0 +1,24 @@
+ FROM nvidia/cuda:12.1.1-devel-ubuntu22.04
+
+ ENV DEBIAN_FRONTEND=noninteractive
+ ENV PYTHONUNBUFFERED=1
+
+ RUN apt-get update && \
+     apt-get install -y python3 python3-pip git build-essential && \
+     rm -rf /var/lib/apt/lists/*
+
+ RUN pip install torch torchvision torchaudio --index-url https://download.pytorch.org/whl/cu121
+
+ RUN pip install transformers==4.42.3 \
+     peft==0.11.1 \
+     accelerate==0.30.1 \
+     bitsandbytes==0.43.1 \
+     trl==0.8.6 \
+     datasets==2.20.0 \
+     sentencepiece \
+     tensorboard
+
+ WORKDIR /app
+ COPY . /app
+
+ # CMD ["python3", "training_phi2.py"]
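As a quick sanity check of the built image, the pinned libraries can be imported and their versions printed (a minimal sketch; the file name check_env.py is illustrative and not part of this commit):

```python
# check_env.py - confirm the versions pinned in the Dockerfile and GPU visibility.
import torch
import transformers
import peft
import accelerate
import datasets

for mod in (transformers, peft, accelerate, datasets):
    print(f"{mod.__name__}=={mod.__version__}")
print(f"torch=={torch.__version__}, CUDA available: {torch.cuda.is_available()}")
```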
data/log_dataset.jsonl ADDED
The diff for this file is too large to render. See raw diff
 
data_analyser.py ADDED
The diff for this file is too large to render. See raw diff
 
docker-compose.yml ADDED
@@ -0,0 +1,19 @@
+ version: '3.8'
+
+ services:
+   tiny_llama_tuning:
+     build: .
+     runtime: nvidia
+     deploy:
+       resources:
+         reservations:
+           devices:
+             - driver: nvidia
+               count: all
+               capabilities: [gpu]
+     volumes:
+       - ./data:/app/data
+       - ./model_output:/app/model_output
+       - ./merged_tinyllama_logger:/app/merged_tinyllama_logger
+
+     command: python3 training_phi2.py
merged_tinyllama_logger/config.json ADDED
@@ -0,0 +1,29 @@
+ {
+   "_name_or_path": "TinyLlama/TinyLlama-1.1B-Chat-v1.0",
+   "architectures": [
+     "LlamaForCausalLM"
+   ],
+   "attention_bias": false,
+   "attention_dropout": 0.0,
+   "bos_token_id": 1,
+   "eos_token_id": 2,
+   "hidden_act": "silu",
+   "hidden_size": 2048,
+   "initializer_range": 0.02,
+   "intermediate_size": 5632,
+   "max_position_embeddings": 2048,
+   "mlp_bias": false,
+   "model_type": "llama",
+   "num_attention_heads": 32,
+   "num_hidden_layers": 22,
+   "num_key_value_heads": 4,
+   "pretraining_tp": 1,
+   "rms_norm_eps": 1e-05,
+   "rope_scaling": null,
+   "rope_theta": 10000.0,
+   "tie_word_embeddings": false,
+   "torch_dtype": "float16",
+   "transformers_version": "4.42.3",
+   "use_cache": true,
+   "vocab_size": 32000
+ }
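The config above encodes TinyLlama's grouped-query attention layout; a small sketch reading it back with transformers (local path assumed from this commit):

```python
from transformers import AutoConfig

cfg = AutoConfig.from_pretrained("./merged_tinyllama_logger")
# 32 query heads share 4 key/value heads, i.e. 8 query heads per KV head (GQA),
# with a head dimension of 2048 / 32 = 64.
print(cfg.num_attention_heads // cfg.num_key_value_heads)  # 8
print(cfg.hidden_size // cfg.num_attention_heads)          # 64
```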
merged_tinyllama_logger/generation_config.json ADDED
@@ -0,0 +1,7 @@
+ {
+   "bos_token_id": 1,
+   "eos_token_id": 2,
+   "max_length": 2048,
+   "pad_token_id": 0,
+   "transformers_version": "4.42.3"
+ }
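These defaults are picked up automatically by generate(); a sketch reading them back explicitly (path assumed local to this commit):

```python
from transformers import GenerationConfig

gen = GenerationConfig.from_pretrained("./merged_tinyllama_logger")
print(gen.max_length, gen.pad_token_id, gen.eos_token_id)  # 2048 0 2
```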
merged_tinyllama_logger/special_tokens_map.json ADDED
@@ -0,0 +1,30 @@
+ {
+   "bos_token": {
+     "content": "<s>",
+     "lstrip": false,
+     "normalized": false,
+     "rstrip": false,
+     "single_word": false
+   },
+   "eos_token": {
+     "content": "</s>",
+     "lstrip": false,
+     "normalized": false,
+     "rstrip": false,
+     "single_word": false
+   },
+   "pad_token": {
+     "content": "</s>",
+     "lstrip": false,
+     "normalized": false,
+     "rstrip": false,
+     "single_word": false
+   },
+   "unk_token": {
+     "content": "<unk>",
+     "lstrip": false,
+     "normalized": false,
+     "rstrip": false,
+     "single_word": false
+   }
+ }
merged_tinyllama_logger/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
merged_tinyllama_logger/tokenizer_config.json ADDED
@@ -0,0 +1,43 @@
+ {
+   "add_bos_token": true,
+   "add_eos_token": false,
+   "add_prefix_space": null,
+   "added_tokens_decoder": {
+     "0": {
+       "content": "<unk>",
+       "lstrip": false,
+       "normalized": false,
+       "rstrip": false,
+       "single_word": false,
+       "special": true
+     },
+     "1": {
+       "content": "<s>",
+       "lstrip": false,
+       "normalized": false,
+       "rstrip": false,
+       "single_word": false,
+       "special": true
+     },
+     "2": {
+       "content": "</s>",
+       "lstrip": false,
+       "normalized": false,
+       "rstrip": false,
+       "single_word": false,
+       "special": true
+     }
+   },
+   "bos_token": "<s>",
+   "chat_template": "{% for message in messages %}\n{% if message['role'] == 'user' %}\n{{ '<|user|>\n' + message['content'] + eos_token }}\n{% elif message['role'] == 'system' %}\n{{ '<|system|>\n' + message['content'] + eos_token }}\n{% elif message['role'] == 'assistant' %}\n{{ '<|assistant|>\n' + message['content'] + eos_token }}\n{% endif %}\n{% if loop.last and add_generation_prompt %}\n{{ '<|assistant|>' }}\n{% endif %}\n{% endfor %}",
+   "clean_up_tokenization_spaces": false,
+   "eos_token": "</s>",
+   "legacy": false,
+   "model_max_length": 2048,
+   "pad_token": "</s>",
+   "padding_side": "left",
+   "sp_model_kwargs": {},
+   "tokenizer_class": "LlamaTokenizer",
+   "unk_token": "<unk>",
+   "use_default_system_prompt": false
+ }
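The chat_template above is TinyLlama's <|system|>/<|user|>/<|assistant|> format; a minimal sketch of rendering a prompt with it (path local to this commit, message content illustrative):

```python
from transformers import AutoTokenizer

tokenizer = AutoTokenizer.from_pretrained("./merged_tinyllama_logger")

messages = [
    {"role": "system", "content": "You analyse application log lines."},
    {"role": "user", "content": "ERROR 2024-07-01 12:00:03 db: connection refused"},
]

# Renders the Jinja chat_template from tokenizer_config.json and appends
# the "<|assistant|>" generation prompt.
prompt = tokenizer.apply_chat_template(messages, tokenize=False, add_generation_prompt=True)
print(prompt)
```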
merging_model.py ADDED
@@ -0,0 +1,52 @@
+ import os
+
+ import torch
+ from peft import PeftModel
+ from transformers import AutoModelForCausalLM, AutoTokenizer
+
+ BASE_MODEL_NAME = "TinyLlama/TinyLlama-1.1B-Chat-v1.0"
+
+ ADAPTER_CHECKPOINT_PATH = "./model_output/phi2_finetuned_logs/checkpoint-575"
+ # e.g. D:\phi2_tuning\model_output\phi2_finetuned_logs\checkpoint-500
+
+ MERGED_MODEL_PATH = "./updated_logger"
+
+ print(f"loading base model from: {BASE_MODEL_NAME}")
+ try:
+     base_model = AutoModelForCausalLM.from_pretrained(
+         BASE_MODEL_NAME,
+         low_cpu_mem_usage=True,
+         return_dict=True,
+         torch_dtype=torch.float16,
+         trust_remote_code=True,
+         device_map="auto",
+     )
+ except Exception as e:
+     print(f"error loading base model: {e}")
+     raise SystemExit(1)
+
+ tokenizer = AutoTokenizer.from_pretrained(BASE_MODEL_NAME, trust_remote_code=True)
+ if tokenizer.pad_token is None:
+     tokenizer.pad_token = tokenizer.eos_token
+ tokenizer.padding_side = "left"
+
+ try:
+     model = PeftModel.from_pretrained(base_model, ADAPTER_CHECKPOINT_PATH)
+ except Exception as e:
+     # Without the adapter there is nothing to merge, so stop here instead of
+     # falling through to merge_and_unload() with an undefined `model`.
+     print(f"error loading the adapter checkpoint: {e}")
+     print("ensure ADAPTER_CHECKPOINT_PATH is correct and retry")
+     raise SystemExit(1)
+
+ # Fold the LoRA weights into the base model so it can be used without peft.
+ merged_model = model.merge_and_unload()
+ print("adapters merged successfully")
+
+ print("saving the merged model...")
+
+ os.makedirs(MERGED_MODEL_PATH, exist_ok=True)
+ merged_model.save_pretrained(MERGED_MODEL_PATH)
+ tokenizer.save_pretrained(MERGED_MODEL_PATH)
+
+ print(f"model merged and saved to {MERGED_MODEL_PATH}")
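Once merged, the output folder loads as a plain causal LM with no peft dependency; a minimal smoke test might look like this (prompt and generation settings are illustrative assumptions, not values from this commit):

```python
import torch
from transformers import AutoModelForCausalLM, AutoTokenizer

tokenizer = AutoTokenizer.from_pretrained("./updated_logger")
model = AutoModelForCausalLM.from_pretrained(
    "./updated_logger", torch_dtype=torch.float16, device_map="auto"
)

prompt = tokenizer.apply_chat_template(
    [{"role": "user", "content": "Classify this log line: ERROR disk full"}],
    tokenize=False,
    add_generation_prompt=True,
)
inputs = tokenizer(prompt, return_tensors="pt").to(model.device)
with torch.no_grad():
    out = model.generate(**inputs, max_new_tokens=64)
# Decode only the newly generated tokens, skipping the echoed prompt.
print(tokenizer.decode(out[0][inputs["input_ids"].shape[1]:], skip_special_tokens=True))
```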
model_output/incremental_1_logs/README.md ADDED
@@ -0,0 +1,202 @@
+ ---
+ base_model: ./merged_tinyllama_logger
+ library_name: peft
+ ---
+
+ # Model Card for Model ID
+
+ <!-- Provide a quick summary of what the model is/does. -->
+
+
+
+ ## Model Details
+
+ ### Model Description
+
+ <!-- Provide a longer summary of what this model is. -->
+
+
+
+ - **Developed by:** [More Information Needed]
+ - **Funded by [optional]:** [More Information Needed]
+ - **Shared by [optional]:** [More Information Needed]
+ - **Model type:** [More Information Needed]
+ - **Language(s) (NLP):** [More Information Needed]
+ - **License:** [More Information Needed]
+ - **Finetuned from model [optional]:** [More Information Needed]
+
+ ### Model Sources [optional]
+
+ <!-- Provide the basic links for the model. -->
+
+ - **Repository:** [More Information Needed]
+ - **Paper [optional]:** [More Information Needed]
+ - **Demo [optional]:** [More Information Needed]
+
+ ## Uses
+
+ <!-- Address questions around how the model is intended to be used, including the foreseeable users of the model and those affected by the model. -->
+
+ ### Direct Use
+
+ <!-- This section is for the model use without fine-tuning or plugging into a larger ecosystem/app. -->
+
+ [More Information Needed]
+
+ ### Downstream Use [optional]
+
+ <!-- This section is for the model use when fine-tuned for a task, or when plugged into a larger ecosystem/app -->
+
+ [More Information Needed]
+
+ ### Out-of-Scope Use
+
+ <!-- This section addresses misuse, malicious use, and uses that the model will not work well for. -->
+
+ [More Information Needed]
+
+ ## Bias, Risks, and Limitations
+
+ <!-- This section is meant to convey both technical and sociotechnical limitations. -->
+
+ [More Information Needed]
+
+ ### Recommendations
+
+ <!-- This section is meant to convey recommendations with respect to the bias, risk, and technical limitations. -->
+
+ Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations.
+
+ ## How to Get Started with the Model
+
+ Use the code below to get started with the model.
+
+ [More Information Needed]
+
+ ## Training Details
+
+ ### Training Data
+
+ <!-- This should link to a Dataset Card, perhaps with a short stub of information on what the training data is all about as well as documentation related to data pre-processing or additional filtering. -->
+
+ [More Information Needed]
+
+ ### Training Procedure
+
+ <!-- This relates heavily to the Technical Specifications. Content here should link to that section when it is relevant to the training procedure. -->
+
+ #### Preprocessing [optional]
+
+ [More Information Needed]
+
+
+ #### Training Hyperparameters
+
+ - **Training regime:** [More Information Needed] <!--fp32, fp16 mixed precision, bf16 mixed precision, bf16 non-mixed precision, fp16 non-mixed precision, fp8 mixed precision -->
+
+ #### Speeds, Sizes, Times [optional]
+
+ <!-- This section provides information about throughput, start/end time, checkpoint size if relevant, etc. -->
+
+ [More Information Needed]
+
+ ## Evaluation
+
+ <!-- This section describes the evaluation protocols and provides the results. -->
+
+ ### Testing Data, Factors & Metrics
+
+ #### Testing Data
+
+ <!-- This should link to a Dataset Card if possible. -->
+
+ [More Information Needed]
+
+ #### Factors
+
+ <!-- These are the things the evaluation is disaggregating by, e.g., subpopulations or domains. -->
+
+ [More Information Needed]
+
+ #### Metrics
+
+ <!-- These are the evaluation metrics being used, ideally with a description of why. -->
+
+ [More Information Needed]
+
+ ### Results
+
+ [More Information Needed]
+
+ #### Summary
+
+
+
+ ## Model Examination [optional]
+
+ <!-- Relevant interpretability work for the model goes here -->
+
+ [More Information Needed]
+
+ ## Environmental Impact
+
+ <!-- Total emissions (in grams of CO2eq) and additional considerations, such as electricity usage, go here. Edit the suggested text below accordingly -->
+
+ Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700).
+
+ - **Hardware Type:** [More Information Needed]
+ - **Hours used:** [More Information Needed]
+ - **Cloud Provider:** [More Information Needed]
+ - **Compute Region:** [More Information Needed]
+ - **Carbon Emitted:** [More Information Needed]
+
+ ## Technical Specifications [optional]
+
+ ### Model Architecture and Objective
+
+ [More Information Needed]
+
+ ### Compute Infrastructure
+
+ [More Information Needed]
+
+ #### Hardware
+
+ [More Information Needed]
+
+ #### Software
+
+ [More Information Needed]
+
+ ## Citation [optional]
+
+ <!-- If there is a paper or blog post introducing the model, the APA and Bibtex information for that should go in this section. -->
+
+ **BibTeX:**
+
+ [More Information Needed]
+
+ **APA:**
+
+ [More Information Needed]
+
+ ## Glossary [optional]
+
+ <!-- If relevant, include terms and calculations in this section that can help readers understand the model or model card. -->
+
+ [More Information Needed]
+
+ ## More Information [optional]
+
+ [More Information Needed]
+
+ ## Model Card Authors [optional]
+
+ [More Information Needed]
+
+ ## Model Card Contact
+
+ [More Information Needed]
+ ### Framework versions
+
+ - PEFT 0.11.1
model_output/incremental_1_logs/adapter_config.json ADDED
@@ -0,0 +1,29 @@
+ {
+   "alpha_pattern": {},
+   "auto_mapping": null,
+   "base_model_name_or_path": "./merged_tinyllama_logger",
+   "bias": "none",
+   "fan_in_fan_out": false,
+   "inference_mode": true,
+   "init_lora_weights": true,
+   "layer_replication": null,
+   "layers_pattern": null,
+   "layers_to_transform": null,
+   "loftq_config": {},
+   "lora_alpha": 124,
+   "lora_dropout": 0.15,
+   "megatron_config": null,
+   "megatron_core": "megatron.core",
+   "modules_to_save": null,
+   "peft_type": "LORA",
+   "r": 32,
+   "rank_pattern": {},
+   "revision": null,
+   "target_modules": [
+     "q_proj",
+     "v_proj"
+   ],
+   "task_type": "CAUSAL_LM",
+   "use_dora": false,
+   "use_rslora": false
+ }
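For reference, this JSON corresponds to a peft LoraConfig roughly like the following (a sketch reconstructed from the fields above, not code taken from this commit):

```python
from peft import LoraConfig

lora_config = LoraConfig(
    r=32,                                 # LoRA rank
    lora_alpha=124,                       # scaling factor: alpha / r ≈ 3.9
    lora_dropout=0.15,
    bias="none",
    target_modules=["q_proj", "v_proj"],  # attention query/value projections only
    task_type="CAUSAL_LM",
)
```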
model_output/incremental_1_logs/checkpoint-575/README.md ADDED
@@ -0,0 +1,202 @@
+ ---
+ base_model: ./merged_tinyllama_logger
+ library_name: peft
+ ---
[The remaining added lines are the same unfilled PEFT model-card template as model_output/incremental_1_logs/README.md above, ending with "### Framework versions / - PEFT 0.11.1".]
model_output/incremental_1_logs/checkpoint-575/adapter_config.json ADDED
@@ -0,0 +1,29 @@
+ {
+   "alpha_pattern": {},
+   "auto_mapping": null,
+   "base_model_name_or_path": "./merged_tinyllama_logger",
+   "bias": "none",
+   "fan_in_fan_out": false,
+   "inference_mode": true,
+   "init_lora_weights": true,
+   "layer_replication": null,
+   "layers_pattern": null,
+   "layers_to_transform": null,
+   "loftq_config": {},
+   "lora_alpha": 124,
+   "lora_dropout": 0.15,
+   "megatron_config": null,
+   "megatron_core": "megatron.core",
+   "modules_to_save": null,
+   "peft_type": "LORA",
+   "r": 32,
+   "rank_pattern": {},
+   "revision": null,
+   "target_modules": [
+     "q_proj",
+     "v_proj"
+   ],
+   "task_type": "CAUSAL_LM",
+   "use_dora": false,
+   "use_rslora": false
+ }
model_output/incremental_1_logs/checkpoint-575/special_tokens_map.json ADDED
@@ -0,0 +1,24 @@
+ {
+   "bos_token": {
+     "content": "<s>",
+     "lstrip": false,
+     "normalized": false,
+     "rstrip": false,
+     "single_word": false
+   },
+   "eos_token": {
+     "content": "</s>",
+     "lstrip": false,
+     "normalized": false,
+     "rstrip": false,
+     "single_word": false
+   },
+   "pad_token": "</s>",
+   "unk_token": {
+     "content": "<unk>",
+     "lstrip": false,
+     "normalized": false,
+     "rstrip": false,
+     "single_word": false
+   }
+ }
model_output/incremental_1_logs/checkpoint-575/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
model_output/incremental_1_logs/checkpoint-575/tokenizer_config.json ADDED
@@ -0,0 +1,43 @@
+ {
+   "add_bos_token": true,
+   "add_eos_token": false,
+   "add_prefix_space": null,
+   "added_tokens_decoder": {
+     "0": {
+       "content": "<unk>",
+       "lstrip": false,
+       "normalized": false,
+       "rstrip": false,
+       "single_word": false,
+       "special": true
+     },
+     "1": {
+       "content": "<s>",
+       "lstrip": false,
+       "normalized": false,
+       "rstrip": false,
+       "single_word": false,
+       "special": true
+     },
+     "2": {
+       "content": "</s>",
+       "lstrip": false,
+       "normalized": false,
+       "rstrip": false,
+       "single_word": false,
+       "special": true
+     }
+   },
+   "bos_token": "<s>",
+   "chat_template": "{% for message in messages %}\n{% if message['role'] == 'user' %}\n{{ '<|user|>\n' + message['content'] + eos_token }}\n{% elif message['role'] == 'system' %}\n{{ '<|system|>\n' + message['content'] + eos_token }}\n{% elif message['role'] == 'assistant' %}\n{{ '<|assistant|>\n' + message['content'] + eos_token }}\n{% endif %}\n{% if loop.last and add_generation_prompt %}\n{{ '<|assistant|>' }}\n{% endif %}\n{% endfor %}",
+   "clean_up_tokenization_spaces": false,
+   "eos_token": "</s>",
+   "legacy": false,
+   "model_max_length": 2048,
+   "pad_token": "</s>",
+   "padding_side": "right",
+   "sp_model_kwargs": {},
+   "tokenizer_class": "LlamaTokenizer",
+   "unk_token": "<unk>",
+   "use_default_system_prompt": false
+ }
model_output/incremental_1_logs/checkpoint-575/trainer_state.json ADDED
@@ -0,0 +1,625 @@
+ {
+   "best_metric": 0.277375727891922,
+   "best_model_checkpoint": "/app/model_output/incremental_1_logs/checkpoint-575",
+   "epoch": 3.893355903512484,
+   "eval_steps": 25,
+   "global_step": 575,
+   "is_hyper_param_search": false,
+   "is_local_process_zero": true,
+   "is_world_process_zero": true,
+   "log_history": [
+     {"epoch": 0.06771053745239103, "grad_norm": 0.12689563632011414, "learning_rate": 5.555555555555556e-05, "loss": 0.3059, "step": 10},
+     {"epoch": 0.13542107490478206, "grad_norm": 0.20696839690208435, "learning_rate": 9.999696229471716e-05, "loss": 0.2664, "step": 20},
+     {"epoch": 0.16927634363097757, "eval_loss": 0.2852177023887634, "eval_runtime": 88.5933, "eval_samples_per_second": 11.852, "eval_steps_per_second": 1.49, "step": 25},
+     {"epoch": 0.20313161235717309, "grad_norm": 0.15301378071308136, "learning_rate": 9.989068136093873e-05, "loss": 0.2856, "step": 30},
+     {"epoch": 0.2708421498095641, "grad_norm": 0.11013192683458328, "learning_rate": 9.963288406760582e-05, "loss": 0.3573, "step": 40},
+     {"epoch": 0.33855268726195514, "grad_norm": 0.11521229147911072, "learning_rate": 9.922435333662536e-05, "loss": 0.219, "step": 50},
+     {"epoch": 0.33855268726195514, "eval_loss": 0.286544531583786, "eval_runtime": 83.9745, "eval_samples_per_second": 12.504, "eval_steps_per_second": 1.572, "step": 50},
+     {"epoch": 0.40626322471434617, "grad_norm": 0.11518555134534836, "learning_rate": 9.86663298624003e-05, "loss": 0.2929, "step": 60},
+     {"epoch": 0.4739737621667372, "grad_norm": 0.15488335490226746, "learning_rate": 9.796050834388149e-05, "loss": 0.3014, "step": 70},
+     {"epoch": 0.5078290308929327, "eval_loss": 0.2851661443710327, "eval_runtime": 86.2574, "eval_samples_per_second": 12.173, "eval_steps_per_second": 1.53, "step": 75},
+     {"epoch": 0.5416842996191282, "grad_norm": 0.0932643935084343, "learning_rate": 9.710903233782272e-05, "loss": 0.2921, "step": 80},
+     {"epoch": 0.6093948370715192, "grad_norm": 0.12357372790575027, "learning_rate": 9.611448774886924e-05, "loss": 0.2477, "step": 90},
+     {"epoch": 0.6771053745239103, "grad_norm": 0.11050555109977722, "learning_rate": 9.497989497625035e-05, "loss": 0.2921, "step": 100},
+     {"epoch": 0.6771053745239103, "eval_loss": 0.28187423944473267, "eval_runtime": 82.6427, "eval_samples_per_second": 12.705, "eval_steps_per_second": 1.597, "step": 100},
+     {"epoch": 0.7448159119763013, "grad_norm": 0.12379597127437592, "learning_rate": 9.370869974092629e-05, "loss": 0.3503, "step": 110},
+     {"epoch": 0.8125264494286923, "grad_norm": 0.09044498205184937, "learning_rate": 9.230476262104677e-05, "loss": 0.2187, "step": 120},
+     {"epoch": 0.8463817181548878, "eval_loss": 0.28196918964385986, "eval_runtime": 81.0323, "eval_samples_per_second": 12.958, "eval_steps_per_second": 1.629, "step": 125},
+     {"epoch": 0.8802369868810833, "grad_norm": 0.08871851861476898, "learning_rate": 9.077234732750224e-05, "loss": 0.2651, "step": 130},
+     {"epoch": 0.9479475243334744, "grad_norm": 0.15373575687408447, "learning_rate": 8.911610775517382e-05, "loss": 0.2926, "step": 140},
+     {"epoch": 1.0156580617858655, "grad_norm": 0.1201297715306282, "learning_rate": 8.73410738492077e-05, "loss": 0.3611, "step": 150},
+     {"epoch": 1.0156580617858655, "eval_loss": 0.2829289138317108, "eval_runtime": 69.3268, "eval_samples_per_second": 15.146, "eval_steps_per_second": 1.904, "step": 150},
+     {"epoch": 1.0833685992382565, "grad_norm": 0.0962260514497757, "learning_rate": 8.545263632923687e-05, "loss": 0.212, "step": 160},
+     {"epoch": 1.1510791366906474, "grad_norm": 0.11213065683841705, "learning_rate": 8.345653031794292e-05, "loss": 0.2705, "step": 170},
+     {"epoch": 1.184934405416843, "eval_loss": 0.28028643131256104, "eval_runtime": 68.9818, "eval_samples_per_second": 15.221, "eval_steps_per_second": 1.914, "step": 175},
+     {"epoch": 1.2187896741430384, "grad_norm": 0.17710012197494507, "learning_rate": 8.135881792367686e-05, "loss": 0.2932, "step": 180},
+     {"epoch": 1.2865002115954296, "grad_norm": 0.08371994644403458, "learning_rate": 7.916586983003533e-05, "loss": 0.3095, "step": 190},
+     {"epoch": 1.3542107490478206, "grad_norm": 0.11087023466825485, "learning_rate": 7.688434594830392e-05, "loss": 0.2339, "step": 200},
+     {"epoch": 1.3542107490478206, "eval_loss": 0.280811071395874, "eval_runtime": 69.3415, "eval_samples_per_second": 15.142, "eval_steps_per_second": 1.904, "step": 200},
+     {"epoch": 1.4219212865002115, "grad_norm": 0.08745381981134415, "learning_rate": 7.452117519152542e-05, "loss": 0.2833, "step": 210},
+     {"epoch": 1.4896318239526027, "grad_norm": 0.2609899342060089, "learning_rate": 7.20835344316187e-05, "loss": 0.325, "step": 220},
+     {"epoch": 1.5234870926787982, "eval_loss": 0.28064557909965515, "eval_runtime": 66.8259, "eval_samples_per_second": 15.712, "eval_steps_per_second": 1.975, "step": 225},
+     {"epoch": 1.5573423614049937, "grad_norm": 0.09044867753982544, "learning_rate": 6.957882670345458e-05, "loss": 0.2485, "step": 230},
+     {"epoch": 1.6250528988573847, "grad_norm": 0.10336604714393616, "learning_rate": 6.701465872208216e-05, "loss": 0.2615, "step": 240},
+     {"epoch": 1.6927634363097757, "grad_norm": 0.11195653676986694, "learning_rate": 6.439881778138531e-05, "loss": 0.2872, "step": 250},
+     {"epoch": 1.6927634363097757, "eval_loss": 0.2789854109287262, "eval_runtime": 71.8328, "eval_samples_per_second": 14.617, "eval_steps_per_second": 1.838, "step": 250},
+     {"epoch": 1.7604739737621666, "grad_norm": 0.08948034793138504, "learning_rate": 6.173924810432705e-05, "loss": 0.3233, "step": 260},
+     {"epoch": 1.8281845112145576, "grad_norm": 0.10628338903188705, "learning_rate": 5.90440267166055e-05, "loss": 0.2191, "step": 270},
+     {"epoch": 1.8620397799407533, "eval_loss": 0.27870360016822815, "eval_runtime": 69.7018, "eval_samples_per_second": 15.064, "eval_steps_per_second": 1.894, "step": 275},
+     {"epoch": 1.8958950486669488, "grad_norm": 0.08356555551290512, "learning_rate": 5.6321338916992315e-05, "loss": 0.2827, "step": 280},
+     {"epoch": 1.9636055861193398, "grad_norm": 0.16241195797920227, "learning_rate": 5.357945341884936e-05, "loss": 0.3, "step": 290},
+     {"epoch": 2.031316123571731, "grad_norm": 0.09376996755599976, "learning_rate": 5.0826697238317935e-05, "loss": 0.3259, "step": 300},
+     {"epoch": 2.031316123571731, "eval_loss": 0.2795935571193695, "eval_runtime": 66.8471, "eval_samples_per_second": 15.707, "eval_steps_per_second": 1.975, "step": 300},
+     {"epoch": 2.099026661024122, "grad_norm": 0.12176941335201263, "learning_rate": 4.8071430405444474e-05, "loss": 0.2162, "step": 310},
+     {"epoch": 2.166737198476513, "grad_norm": 0.10181087255477905, "learning_rate": 4.5322020575044114e-05, "loss": 0.2799, "step": 320},
+     {"epoch": 2.2005924672027084, "eval_loss": 0.2783721089363098, "eval_runtime": 66.1795, "eval_samples_per_second": 15.866, "eval_steps_per_second": 1.995, "step": 325},
+     {"epoch": 2.234447735928904, "grad_norm": 0.16512344777584076, "learning_rate": 4.2586817614407895e-05, "loss": 0.3018, "step": 330},
+     {"epoch": 2.302158273381295, "grad_norm": 0.08763137459754944, "learning_rate": 3.9874128245030404e-05, "loss": 0.2788, "step": 340},
+     {"epoch": 2.369868810833686, "grad_norm": 0.17856952548027039, "learning_rate": 3.719219081536942e-05, "loss": 0.2435, "step": 350},
+     {"epoch": 2.369868810833686, "eval_loss": 0.27819639444351196, "eval_runtime": 67.9684, "eval_samples_per_second": 15.448, "eval_steps_per_second": 1.942, "step": 350},
+     {"epoch": 2.437579348286077, "grad_norm": 0.10516191273927689, "learning_rate": 3.4549150281252636e-05, "loss": 0.2824, "step": 360},
+     {"epoch": 2.505289885738468, "grad_norm": 0.11505354195833206, "learning_rate": 3.1953033469914276e-05, "loss": 0.3472, "step": 370},
+     {"epoch": 2.5391451544646637, "eval_loss": 0.27820467948913574, "eval_runtime": 71.3828, "eval_samples_per_second": 14.709, "eval_steps_per_second": 1.849, "step": 375},
+     {"epoch": 2.573000423190859, "grad_norm": 0.09948902577161789, "learning_rate": 2.9411724702784758e-05, "loss": 0.2087, "step": 380},
+     {"epoch": 2.64071096064325, "grad_norm": 0.10510896891355515, "learning_rate": 2.693294185106562e-05, "loss": 0.2713, "step": 390},
+     {"epoch": 2.708421498095641, "grad_norm": 0.1592397391796112, "learning_rate": 2.4524212896808263e-05, "loss": 0.2925, "step": 400},
+     {"epoch": 2.708421498095641, "eval_loss": 0.27774715423583984, "eval_runtime": 71.1939, "eval_samples_per_second": 14.748, "eval_steps_per_second": 1.854, "step": 400},
+     {"epoch": 2.776132035548032, "grad_norm": 0.0951530858874321, "learning_rate": 2.219285307067997e-05, "loss": 0.2949, "step": 410},
+     {"epoch": 2.843842573000423, "grad_norm": 0.11100845783948898, "learning_rate": 1.9945942635848748e-05, "loss": 0.2293, "step": 420},
+     {"epoch": 2.8776978417266186, "eval_loss": 0.27757009863853455, "eval_runtime": 68.4609, "eval_samples_per_second": 15.337, "eval_steps_per_second": 1.928, "step": 425},
+     {"epoch": 2.911553110452814, "grad_norm": 0.10450287908315659, "learning_rate": 1.7790305385456795e-05, "loss": 0.286, "step": 430},
+     {"epoch": 2.9792636479052055, "grad_norm": 0.22524423897266388, "learning_rate": 1.5732487918985018e-05, "loss": 0.3127, "step": 440},
+     {"epoch": 3.0469741853575965, "grad_norm": 0.09041011333465576, "learning_rate": 1.3778739760445552e-05, "loss": 0.2899, "step": 450},
+     {"epoch": 3.0469741853575965, "eval_loss": 0.2776949107646942, "eval_runtime": 71.1823, "eval_samples_per_second": 14.751, "eval_steps_per_second": 1.854, "step": 450},
+     {"epoch": 3.1146847228099874, "grad_norm": 0.09738585352897644, "learning_rate": 1.1934994378782772e-05, "loss": 0.2271, "step": 460},
+     {"epoch": 3.1823952602623784, "grad_norm": 0.09352873265743256, "learning_rate": 1.0206851168123077e-05, "loss": 0.2823, "step": 470},
+     {"epoch": 3.216250528988574, "eval_loss": 0.2774777412414551, "eval_runtime": 69.6841, "eval_samples_per_second": 15.068, "eval_steps_per_second": 1.894, "step": 475},
+     {"epoch": 3.2501057977147694, "grad_norm": 0.32003673911094666, "learning_rate": 8.599558442598998e-06, "loss": 0.344, "step": 480},
+     {"epoch": 3.3178163351671603, "grad_norm": 0.09081516414880753, "learning_rate": 7.1179974973916486e-06, "loss": 0.214, "step": 490},
+     {"epoch": 3.3855268726195513, "grad_norm": 0.11058734357357025, "learning_rate": 5.766667784397706e-06, "loss": 0.2584, "step": 500},
+     {"epoch": 3.3855268726195513, "eval_loss": 0.27743011713027954, "eval_runtime": 70.1397, "eval_samples_per_second": 14.97, "eval_steps_per_second": 1.882, "step": 500},
+     {"epoch": 3.4532374100719423, "grad_norm": 0.11014135181903839, "learning_rate": 4.549673247541875e-06, "loss": 0.2854, "step": 510},
+     {"epoch": 3.5209479475243333, "grad_norm": 0.09463568776845932, "learning_rate": 3.470709859234084e-06, "loss": 0.316, "step": 520},
+     {"epoch": 3.554803216250529, "eval_loss": 0.2773997485637665, "eval_runtime": 68.4347, "eval_samples_per_second": 15.343, "eval_steps_per_second": 1.929, "step": 525},
+     {"epoch": 3.5886584849767242, "grad_norm": 0.09929580241441727, "learning_rate": 2.533054395822704e-06, "loss": 0.2195, "step": 530},
+     {"epoch": 3.6563690224291157, "grad_norm": 0.0915316790342331, "learning_rate": 1.7395544861325718e-06, "loss": 0.2809, "step": 540},
+     {"epoch": 3.7240795598815066, "grad_norm": 0.17164337635040283, "learning_rate": 1.0926199633097157e-06, "loss": 0.3022, "step": 550},
+     {"epoch": 3.7240795598815066, "eval_loss": 0.27738305926322937, "eval_runtime": 68.6988, "eval_samples_per_second": 15.284, "eval_steps_per_second": 1.921, "step": 550},
+     {"epoch": 3.7917900973338976, "grad_norm": 0.09638968855142593, "learning_rate": 5.9421554623742e-07, "loss": 0.2669, "step": 560},
+     {"epoch": 3.8595006347862886, "grad_norm": 0.18140298128128052, "learning_rate": 2.458548727494292e-07, "loss": 0.2454, "step": 570},
+     {"epoch": 3.893355903512484, "eval_loss": 0.277375727891922, "eval_runtime": 72.7395, "eval_samples_per_second": 14.435, "eval_steps_per_second": 1.815, "step": 575}
+   ],
+   "logging_steps": 10,
+   "max_steps": 588,
+   "num_input_tokens_seen": 0,
+   "num_train_epochs": 4,
+   "save_steps": 25,
+   "stateful_callbacks": {
+     "EarlyStoppingCallback": {
+       "args": {"early_stopping_patience": 7, "early_stopping_threshold": 0.0},
+       "attributes": {"early_stopping_patience_counter": 0}
+     },
+     "TrainerControl": {
+       "args": {"should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": false},
+       "attributes": {}
+     }
+   },
+   "total_flos": 3.485296471781376e+16,
+   "train_batch_size": 4,
+   "trial_name": null,
+   "trial_params": null
+ }
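The state records early stopping with patience 7 and the best eval_loss (≈0.2774) at step 575; a small sketch for pulling the evaluation curve back out of this file (path as committed):

```python
import json

with open("model_output/incremental_1_logs/checkpoint-575/trainer_state.json") as f:
    state = json.load(f)

print(state["best_metric"], state["best_model_checkpoint"])
# (step, eval_loss) pairs from the interleaved train/eval log history.
evals = [(e["step"], e["eval_loss"]) for e in state["log_history"] if "eval_loss" in e]
print(evals[0], evals[-1])  # (25, 0.2852...) (575, 0.2774...)
```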
model_output/incremental_1_logs/special_tokens_map.json ADDED
@@ -0,0 +1,24 @@
+ {
+   "bos_token": {
+     "content": "<s>",
+     "lstrip": false,
+     "normalized": false,
+     "rstrip": false,
+     "single_word": false
+   },
+   "eos_token": {
+     "content": "</s>",
+     "lstrip": false,
+     "normalized": false,
+     "rstrip": false,
+     "single_word": false
+   },
+   "pad_token": "</s>",
+   "unk_token": {
+     "content": "<unk>",
+     "lstrip": false,
+     "normalized": false,
+     "rstrip": false,
+     "single_word": false
+   }
+ }
model_output/incremental_1_logs/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
model_output/incremental_1_logs/tokenizer_config.json ADDED
@@ -0,0 +1,43 @@
+ {
+   "add_bos_token": true,
+   "add_eos_token": false,
+   "add_prefix_space": null,
+   "added_tokens_decoder": {
+     "0": {
+       "content": "<unk>",
+       "lstrip": false,
+       "normalized": false,
+       "rstrip": false,
+       "single_word": false,
+       "special": true
+     },
+     "1": {
+       "content": "<s>",
+       "lstrip": false,
+       "normalized": false,
+       "rstrip": false,
+       "single_word": false,
+       "special": true
+     },
+     "2": {
+       "content": "</s>",
+       "lstrip": false,
+       "normalized": false,
+       "rstrip": false,
+       "single_word": false,
+       "special": true
+     }
+   },
+   "bos_token": "<s>",
+   "chat_template": "{% for message in messages %}\n{% if message['role'] == 'user' %}\n{{ '<|user|>\n' + message['content'] + eos_token }}\n{% elif message['role'] == 'system' %}\n{{ '<|system|>\n' + message['content'] + eos_token }}\n{% elif message['role'] == 'assistant' %}\n{{ '<|assistant|>\n' + message['content'] + eos_token }}\n{% endif %}\n{% if loop.last and add_generation_prompt %}\n{{ '<|assistant|>' }}\n{% endif %}\n{% endfor %}",
+   "clean_up_tokenization_spaces": false,
+   "eos_token": "</s>",
+   "legacy": false,
+   "model_max_length": 2048,
+   "pad_token": "</s>",
+   "padding_side": "right",
+   "sp_model_kwargs": {},
+   "tokenizer_class": "LlamaTokenizer",
+   "unk_token": "<unk>",
+   "use_default_system_prompt": false
+ }
model_output/phi2_finetuned_logs/README.md ADDED
@@ -0,0 +1,202 @@
+ ---
+ base_model: TinyLlama/TinyLlama-1.1B-Chat-v1.0
+ library_name: peft
+ ---
[The remaining added lines are the same unfilled PEFT model-card template as model_output/incremental_1_logs/README.md above, ending with "### Framework versions / - PEFT 0.11.1".]
model_output/phi2_finetuned_logs/adapter_config.json ADDED
@@ -0,0 +1,29 @@
+ {
+   "alpha_pattern": {},
+   "auto_mapping": null,
+   "base_model_name_or_path": "TinyLlama/TinyLlama-1.1B-Chat-v1.0",
+   "bias": "none",
+   "fan_in_fan_out": false,
+   "inference_mode": true,
+   "init_lora_weights": true,
+   "layer_replication": null,
+   "layers_pattern": null,
+   "layers_to_transform": null,
+   "loftq_config": {},
+   "lora_alpha": 124,
+   "lora_dropout": 0.15,
+   "megatron_config": null,
+   "megatron_core": "megatron.core",
+   "modules_to_save": null,
+   "peft_type": "LORA",
+   "r": 32,
+   "rank_pattern": {},
+   "revision": null,
+   "target_modules": [
+     "v_proj",
+     "q_proj"
+   ],
+   "task_type": "CAUSAL_LM",
+   "use_dora": false,
+   "use_rslora": false
+ }
model_output/phi2_finetuned_logs/special_tokens_map.json ADDED
@@ -0,0 +1,24 @@
+ {
+   "bos_token": {
+     "content": "<s>",
+     "lstrip": false,
+     "normalized": false,
+     "rstrip": false,
+     "single_word": false
+   },
+   "eos_token": {
+     "content": "</s>",
+     "lstrip": false,
+     "normalized": false,
+     "rstrip": false,
+     "single_word": false
+   },
+   "pad_token": "</s>",
+   "unk_token": {
+     "content": "<unk>",
+     "lstrip": false,
+     "normalized": false,
+     "rstrip": false,
+     "single_word": false
+   }
+ }
model_output/phi2_finetuned_logs/tokenizer.json ADDED
The diff for this file is too large to render.
model_output/phi2_finetuned_logs/tokenizer_config.json ADDED
@@ -0,0 +1,43 @@
+ {
+   "add_bos_token": true,
+   "add_eos_token": false,
+   "add_prefix_space": null,
+   "added_tokens_decoder": {
+     "0": {
+       "content": "<unk>",
+       "lstrip": false,
+       "normalized": false,
+       "rstrip": false,
+       "single_word": false,
+       "special": true
+     },
+     "1": {
+       "content": "<s>",
+       "lstrip": false,
+       "normalized": false,
+       "rstrip": false,
+       "single_word": false,
+       "special": true
+     },
+     "2": {
+       "content": "</s>",
+       "lstrip": false,
+       "normalized": false,
+       "rstrip": false,
+       "single_word": false,
+       "special": true
+     }
+   },
+   "bos_token": "<s>",
+   "chat_template": "{% for message in messages %}\n{% if message['role'] == 'user' %}\n{{ '<|user|>\n' + message['content'] + eos_token }}\n{% elif message['role'] == 'system' %}\n{{ '<|system|>\n' + message['content'] + eos_token }}\n{% elif message['role'] == 'assistant' %}\n{{ '<|assistant|>\n' + message['content'] + eos_token }}\n{% endif %}\n{% if loop.last and add_generation_prompt %}\n{{ '<|assistant|>' }}\n{% endif %}\n{% endfor %}",
+   "clean_up_tokenization_spaces": false,
+   "eos_token": "</s>",
+   "legacy": false,
+   "model_max_length": 2048,
+   "pad_token": "</s>",
+   "padding_side": "right",
+   "sp_model_kwargs": {},
+   "tokenizer_class": "LlamaTokenizer",
+   "unk_token": "<unk>",
+   "use_default_system_prompt": false
+ }
phivenv/Lib/site-packages/certifi-2025.8.3.dist-info/INSTALLER ADDED
@@ -0,0 +1 @@
+ pip
phivenv/Lib/site-packages/certifi-2025.8.3.dist-info/METADATA ADDED
@@ -0,0 +1,77 @@
+ Metadata-Version: 2.4
+ Name: certifi
+ Version: 2025.8.3
+ Summary: Python package for providing Mozilla's CA Bundle.
+ Home-page: https://github.com/certifi/python-certifi
+ Author: Kenneth Reitz
+ Author-email: me@kennethreitz.com
+ License: MPL-2.0
+ Project-URL: Source, https://github.com/certifi/python-certifi
+ Classifier: Development Status :: 5 - Production/Stable
+ Classifier: Intended Audience :: Developers
+ Classifier: License :: OSI Approved :: Mozilla Public License 2.0 (MPL 2.0)
+ Classifier: Natural Language :: English
+ Classifier: Programming Language :: Python
+ Classifier: Programming Language :: Python :: 3
+ Classifier: Programming Language :: Python :: 3 :: Only
+ Classifier: Programming Language :: Python :: 3.7
+ Classifier: Programming Language :: Python :: 3.8
+ Classifier: Programming Language :: Python :: 3.9
+ Classifier: Programming Language :: Python :: 3.10
+ Classifier: Programming Language :: Python :: 3.11
+ Classifier: Programming Language :: Python :: 3.12
+ Classifier: Programming Language :: Python :: 3.13
+ Requires-Python: >=3.7
+ License-File: LICENSE
+ Dynamic: author
+ Dynamic: author-email
+ Dynamic: classifier
+ Dynamic: description
+ Dynamic: home-page
+ Dynamic: license
+ Dynamic: license-file
+ Dynamic: project-url
+ Dynamic: requires-python
+ Dynamic: summary
+ 
+ Certifi: Python SSL Certificates
+ ================================
+ 
+ Certifi provides Mozilla's carefully curated collection of Root Certificates for
+ validating the trustworthiness of SSL certificates while verifying the identity
+ of TLS hosts. It has been extracted from the `Requests`_ project.
+ 
+ Installation
+ ------------
+ 
+ ``certifi`` is available on PyPI. Simply install it with ``pip``::
+ 
+     $ pip install certifi
+ 
+ Usage
+ -----
+ 
+ To reference the installed certificate authority (CA) bundle, you can use the
+ built-in function::
+ 
+     >>> import certifi
+ 
+     >>> certifi.where()
+     '/usr/local/lib/python3.7/site-packages/certifi/cacert.pem'
+ 
+ Or from the command line::
+ 
+     $ python -m certifi
+     /usr/local/lib/python3.7/site-packages/certifi/cacert.pem
+ 
+ Enjoy!
+ 
+ .. _`Requests`: https://requests.readthedocs.io/en/master/
+ 
+ Addition/Removal of Certificates
+ --------------------------------
+ 
+ Certifi does not support any addition/removal or other modification of the
+ CA trust store content. This project is intended to provide a reliable and
+ highly portable root of trust to python deployments. Look to upstream projects
+ for methods to use alternate trust.
phivenv/Lib/site-packages/certifi-2025.8.3.dist-info/RECORD ADDED
@@ -0,0 +1,14 @@
+ certifi-2025.8.3.dist-info/INSTALLER,sha256=zuuue4knoyJ-UwPPXg8fezS7VCrXJQrAP7zeNuwvFQg,4
+ certifi-2025.8.3.dist-info/METADATA,sha256=z4sG3fosbP3nviub_TUpSb71z0bPmsp3Xa6ZIatGUe4,2422
+ certifi-2025.8.3.dist-info/RECORD,,
+ certifi-2025.8.3.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
+ certifi-2025.8.3.dist-info/licenses/LICENSE,sha256=6TcW2mucDVpKHfYP5pWzcPBpVgPSH2-D8FPkLPwQyvc,989
+ certifi-2025.8.3.dist-info/top_level.txt,sha256=KMu4vUCfsjLrkPbSNdgdekS-pVJzBAJFO__nI8NF6-U,8
+ certifi/__init__.py,sha256=0a5ro4KTYep37Oo0Z8TycCPXaDlOEtvuj2pNWZ_1t8Y,94
+ certifi/__main__.py,sha256=xBBoj905TUWBLRGANOcf7oi6e-3dMP4cEoG9OyMs11g,243
+ certifi/__pycache__/__init__.cpython-39.pyc,,
+ certifi/__pycache__/__main__.cpython-39.pyc,,
+ certifi/__pycache__/core.cpython-39.pyc,,
+ certifi/cacert.pem,sha256=kQLmo2RKBxumzb1KU2mPKRxKZLGEUKCLwEZUi221zIs,287634
+ certifi/core.py,sha256=XFXycndG5pf37ayeF8N32HUuDafsyhkVMbO4BAPWHa0,3394
+ certifi/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
phivenv/Lib/site-packages/certifi-2025.8.3.dist-info/WHEEL ADDED
@@ -0,0 +1,5 @@
+ Wheel-Version: 1.0
+ Generator: setuptools (80.9.0)
+ Root-Is-Purelib: true
+ Tag: py3-none-any
+ 
phivenv/Lib/site-packages/certifi-2025.8.3.dist-info/licenses/LICENSE ADDED
@@ -0,0 +1,20 @@
+ This package contains a modified version of ca-bundle.crt:
+ 
+ ca-bundle.crt -- Bundle of CA Root Certificates
+ 
+ This is a bundle of X.509 certificates of public Certificate Authorities
+ (CA). These were automatically extracted from Mozilla's root certificates
+ file (certdata.txt). This file can be found in the mozilla source tree:
+ https://hg.mozilla.org/mozilla-central/file/tip/security/nss/lib/ckfw/builtins/certdata.txt
+ It contains the certificates in PEM format and therefore
+ can be directly used with curl / libcurl / php_curl, or with
+ an Apache+mod_ssl webserver for SSL client authentication.
+ Just configure this file as the SSLCACertificateFile.#
+ 
+ ***** BEGIN LICENSE BLOCK *****
+ This Source Code Form is subject to the terms of the Mozilla Public License,
+ v. 2.0. If a copy of the MPL was not distributed with this file, You can obtain
+ one at http://mozilla.org/MPL/2.0/.
+ 
+ ***** END LICENSE BLOCK *****
+ @(#) $RCSfile: certdata.txt,v $ $Revision: 1.80 $ $Date: 2011/11/03 15:11:58 $
phivenv/Lib/site-packages/certifi-2025.8.3.dist-info/top_level.txt ADDED
@@ -0,0 +1 @@
+ certifi
phivenv/Lib/site-packages/certifi/__init__.py ADDED
@@ -0,0 +1,4 @@
+ from .core import contents, where
+ 
+ __all__ = ["contents", "where"]
+ __version__ = "2025.08.03"
phivenv/Lib/site-packages/certifi/__main__.py ADDED
@@ -0,0 +1,12 @@
+ import argparse
+ 
+ from certifi import contents, where
+ 
+ parser = argparse.ArgumentParser()
+ parser.add_argument("-c", "--contents", action="store_true")
+ args = parser.parse_args()
+ 
+ if args.contents:
+     print(contents())
+ else:
+     print(where())
phivenv/Lib/site-packages/certifi/__pycache__/__init__.cpython-39.pyc ADDED
Binary file (264 Bytes).
phivenv/Lib/site-packages/certifi/__pycache__/__main__.cpython-39.pyc ADDED
Binary file (400 Bytes).
phivenv/Lib/site-packages/certifi/__pycache__/core.cpython-39.pyc ADDED
Binary file (1.37 kB).
phivenv/Lib/site-packages/certifi/cacert.pem ADDED
The diff for this file is too large to render.
phivenv/Lib/site-packages/certifi/core.py ADDED
@@ -0,0 +1,83 @@
+ """
+ certifi.py
+ ~~~~~~~~~~
+ 
+ This module returns the installation location of cacert.pem or its contents.
+ """
+ import sys
+ import atexit
+ 
+ def exit_cacert_ctx() -> None:
+     _CACERT_CTX.__exit__(None, None, None)  # type: ignore[union-attr]
+ 
+ 
+ if sys.version_info >= (3, 11):
+ 
+     from importlib.resources import as_file, files
+ 
+     _CACERT_CTX = None
+     _CACERT_PATH = None
+ 
+     def where() -> str:
+         # This is slightly terrible, but we want to delay extracting the file
+         # in cases where we're inside of a zipimport situation until someone
+         # actually calls where(), but we don't want to re-extract the file
+         # on every call of where(), so we'll do it once then store it in a
+         # global variable.
+         global _CACERT_CTX
+         global _CACERT_PATH
+         if _CACERT_PATH is None:
+             # This is slightly janky, the importlib.resources API wants you to
+             # manage the cleanup of this file, so it doesn't actually return a
+             # path, it returns a context manager that will give you the path
+             # when you enter it and will do any cleanup when you leave it. In
+             # the common case of not needing a temporary file, it will just
+             # return the file system location and the __exit__() is a no-op.
+             #
+             # We also have to hold onto the actual context manager, because
+             # it will do the cleanup whenever it gets garbage collected, so
+             # we will also store that at the global level as well.
+             _CACERT_CTX = as_file(files("certifi").joinpath("cacert.pem"))
+             _CACERT_PATH = str(_CACERT_CTX.__enter__())
+             atexit.register(exit_cacert_ctx)
+ 
+         return _CACERT_PATH
+ 
+     def contents() -> str:
+         return files("certifi").joinpath("cacert.pem").read_text(encoding="ascii")
+ 
+ else:
+ 
+     from importlib.resources import path as get_path, read_text
+ 
+     _CACERT_CTX = None
+     _CACERT_PATH = None
+ 
+     def where() -> str:
+         # This is slightly terrible, but we want to delay extracting the
+         # file in cases where we're inside of a zipimport situation until
+         # someone actually calls where(), but we don't want to re-extract
+         # the file on every call of where(), so we'll do it once then store
+         # it in a global variable.
+         global _CACERT_CTX
+         global _CACERT_PATH
+         if _CACERT_PATH is None:
+             # This is slightly janky, the importlib.resources API wants you
+             # to manage the cleanup of this file, so it doesn't actually
+             # return a path, it returns a context manager that will give
+             # you the path when you enter it and will do any cleanup when
+             # you leave it. In the common case of not needing a temporary
+             # file, it will just return the file system location and the
+             # __exit__() is a no-op.
+             #
+             # We also have to hold onto the actual context manager, because
+             # it will do the cleanup whenever it gets garbage collected, so
+             # we will also store that at the global level as well.
+             _CACERT_CTX = get_path("certifi", "cacert.pem")
+             _CACERT_PATH = str(_CACERT_CTX.__enter__())
+             atexit.register(exit_cacert_ctx)
+ 
+         return _CACERT_PATH
+ 
+     def contents() -> str:
+         return read_text("certifi", "cacert.pem", encoding="ascii")
phivenv/Lib/site-packages/certifi/py.typed ADDED
File without changes
phivenv/Lib/site-packages/charset_normalizer/api.py ADDED
@@ -0,0 +1,669 @@
+ from __future__ import annotations
+ 
+ import logging
+ from os import PathLike
+ from typing import BinaryIO
+ 
+ from .cd import (
+     coherence_ratio,
+     encoding_languages,
+     mb_encoding_languages,
+     merge_coherence_ratios,
+ )
+ from .constant import IANA_SUPPORTED, TOO_BIG_SEQUENCE, TOO_SMALL_SEQUENCE, TRACE
+ from .md import mess_ratio
+ from .models import CharsetMatch, CharsetMatches
+ from .utils import (
+     any_specified_encoding,
+     cut_sequence_chunks,
+     iana_name,
+     identify_sig_or_bom,
+     is_cp_similar,
+     is_multi_byte_encoding,
+     should_strip_sig_or_bom,
+ )
+ 
+ logger = logging.getLogger("charset_normalizer")
+ explain_handler = logging.StreamHandler()
+ explain_handler.setFormatter(
+     logging.Formatter("%(asctime)s | %(levelname)s | %(message)s")
+ )
+ 
+ 
+ def from_bytes(
+     sequences: bytes | bytearray,
+     steps: int = 5,
+     chunk_size: int = 512,
+     threshold: float = 0.2,
+     cp_isolation: list[str] | None = None,
+     cp_exclusion: list[str] | None = None,
+     preemptive_behaviour: bool = True,
+     explain: bool = False,
+     language_threshold: float = 0.1,
+     enable_fallback: bool = True,
+ ) -> CharsetMatches:
+     """
+     Given a raw bytes sequence, return the best possibles charset usable to render str objects.
+     If there is no results, it is a strong indicator that the source is binary/not text.
+     By default, the process will extract 5 blocks of 512o each to assess the mess and coherence of a given sequence.
+     And will give up a particular code page after 20% of measured mess. Those criteria are customizable at will.
+ 
+     The preemptive behavior DOES NOT replace the traditional detection workflow, it prioritize a particular code page
+     but never take it for granted. Can improve the performance.
+ 
+     You may want to focus your attention to some code page or/and not others, use cp_isolation and cp_exclusion for that
+     purpose.
+ 
+     This function will strip the SIG in the payload/sequence every time except on UTF-16, UTF-32.
+     By default the library does not setup any handler other than the NullHandler, if you choose to set the 'explain'
+     toggle to True it will alter the logger configuration to add a StreamHandler that is suitable for debugging.
+     Custom logging format and handler can be set manually.
+     """
+ 
+     if not isinstance(sequences, (bytearray, bytes)):
+         raise TypeError(
+             "Expected object of type bytes or bytearray, got: {}".format(
+                 type(sequences)
+             )
+         )
+ 
+     if explain:
+         previous_logger_level: int = logger.level
+         logger.addHandler(explain_handler)
+         logger.setLevel(TRACE)
+ 
+     length: int = len(sequences)
+ 
+     if length == 0:
+         logger.debug("Encoding detection on empty bytes, assuming utf_8 intention.")
+         if explain:  # Defensive: ensure exit path clean handler
+             logger.removeHandler(explain_handler)
+             logger.setLevel(previous_logger_level or logging.WARNING)
+         return CharsetMatches([CharsetMatch(sequences, "utf_8", 0.0, False, [], "")])
+ 
+     if cp_isolation is not None:
+         logger.log(
+             TRACE,
+             "cp_isolation is set. use this flag for debugging purpose. "
+             "limited list of encoding allowed : %s.",
+             ", ".join(cp_isolation),
+         )
+         cp_isolation = [iana_name(cp, False) for cp in cp_isolation]
+     else:
+         cp_isolation = []
+ 
+     if cp_exclusion is not None:
+         logger.log(
+             TRACE,
+             "cp_exclusion is set. use this flag for debugging purpose. "
+             "limited list of encoding excluded : %s.",
+             ", ".join(cp_exclusion),
+         )
+         cp_exclusion = [iana_name(cp, False) for cp in cp_exclusion]
+     else:
+         cp_exclusion = []
+ 
+     if length <= (chunk_size * steps):
+         logger.log(
+             TRACE,
+             "override steps (%i) and chunk_size (%i) as content does not fit (%i byte(s) given) parameters.",
+             steps,
+             chunk_size,
+             length,
+         )
+         steps = 1
+         chunk_size = length
+ 
+     if steps > 1 and length / steps < chunk_size:
+         chunk_size = int(length / steps)
+ 
+     is_too_small_sequence: bool = len(sequences) < TOO_SMALL_SEQUENCE
+     is_too_large_sequence: bool = len(sequences) >= TOO_BIG_SEQUENCE
+ 
+     if is_too_small_sequence:
+         logger.log(
+             TRACE,
+             "Trying to detect encoding from a tiny portion of ({}) byte(s).".format(
+                 length
+             ),
+         )
+     elif is_too_large_sequence:
+         logger.log(
+             TRACE,
+             "Using lazy str decoding because the payload is quite large, ({}) byte(s).".format(
+                 length
+             ),
+         )
+ 
+     prioritized_encodings: list[str] = []
+ 
+     specified_encoding: str | None = (
+         any_specified_encoding(sequences) if preemptive_behaviour else None
+     )
+ 
+     if specified_encoding is not None:
+         prioritized_encodings.append(specified_encoding)
+         logger.log(
+             TRACE,
+             "Detected declarative mark in sequence. Priority +1 given for %s.",
+             specified_encoding,
+         )
+ 
+     tested: set[str] = set()
+     tested_but_hard_failure: list[str] = []
+     tested_but_soft_failure: list[str] = []
+ 
+     fallback_ascii: CharsetMatch | None = None
+     fallback_u8: CharsetMatch | None = None
+     fallback_specified: CharsetMatch | None = None
+ 
+     results: CharsetMatches = CharsetMatches()
+ 
+     early_stop_results: CharsetMatches = CharsetMatches()
+ 
+     sig_encoding, sig_payload = identify_sig_or_bom(sequences)
+ 
+     if sig_encoding is not None:
+         prioritized_encodings.append(sig_encoding)
+         logger.log(
+             TRACE,
+             "Detected a SIG or BOM mark on first %i byte(s). Priority +1 given for %s.",
+             len(sig_payload),
+             sig_encoding,
+         )
+ 
+     prioritized_encodings.append("ascii")
+ 
+     if "utf_8" not in prioritized_encodings:
+         prioritized_encodings.append("utf_8")
+ 
+     for encoding_iana in prioritized_encodings + IANA_SUPPORTED:
+         if cp_isolation and encoding_iana not in cp_isolation:
+             continue
+ 
+         if cp_exclusion and encoding_iana in cp_exclusion:
+             continue
+ 
+         if encoding_iana in tested:
+             continue
+ 
+         tested.add(encoding_iana)
+ 
+         decoded_payload: str | None = None
+         bom_or_sig_available: bool = sig_encoding == encoding_iana
+         strip_sig_or_bom: bool = bom_or_sig_available and should_strip_sig_or_bom(
+             encoding_iana
+         )
+ 
+         if encoding_iana in {"utf_16", "utf_32"} and not bom_or_sig_available:
+             logger.log(
+                 TRACE,
+                 "Encoding %s won't be tested as-is because it require a BOM. Will try some sub-encoder LE/BE.",
+                 encoding_iana,
+             )
+             continue
+         if encoding_iana in {"utf_7"} and not bom_or_sig_available:
+             logger.log(
+                 TRACE,
+                 "Encoding %s won't be tested as-is because detection is unreliable without BOM/SIG.",
+                 encoding_iana,
+             )
+             continue
+ 
+         try:
+             is_multi_byte_decoder: bool = is_multi_byte_encoding(encoding_iana)
+         except (ModuleNotFoundError, ImportError):
+             logger.log(
+                 TRACE,
+                 "Encoding %s does not provide an IncrementalDecoder",
+                 encoding_iana,
+             )
+             continue
+ 
+         try:
+             if is_too_large_sequence and is_multi_byte_decoder is False:
+                 str(
+                     (
+                         sequences[: int(50e4)]
+                         if strip_sig_or_bom is False
+                         else sequences[len(sig_payload) : int(50e4)]
+                     ),
+                     encoding=encoding_iana,
+                 )
+             else:
+                 decoded_payload = str(
+                     (
+                         sequences
+                         if strip_sig_or_bom is False
+                         else sequences[len(sig_payload) :]
+                     ),
+                     encoding=encoding_iana,
+                 )
+         except (UnicodeDecodeError, LookupError) as e:
+             if not isinstance(e, LookupError):
+                 logger.log(
+                     TRACE,
+                     "Code page %s does not fit given bytes sequence at ALL. %s",
+                     encoding_iana,
+                     str(e),
+                 )
+             tested_but_hard_failure.append(encoding_iana)
+             continue
+ 
+         similar_soft_failure_test: bool = False
+ 
+         for encoding_soft_failed in tested_but_soft_failure:
+             if is_cp_similar(encoding_iana, encoding_soft_failed):
+                 similar_soft_failure_test = True
+                 break
+ 
+         if similar_soft_failure_test:
+             logger.log(
+                 TRACE,
+                 "%s is deemed too similar to code page %s and was consider unsuited already. Continuing!",
+                 encoding_iana,
+                 encoding_soft_failed,
+             )
+             continue
+ 
+         r_ = range(
+             0 if not bom_or_sig_available else len(sig_payload),
+             length,
+             int(length / steps),
+         )
+ 
+         multi_byte_bonus: bool = (
+             is_multi_byte_decoder
+             and decoded_payload is not None
+             and len(decoded_payload) < length
+         )
+ 
+         if multi_byte_bonus:
+             logger.log(
+                 TRACE,
+                 "Code page %s is a multi byte encoding table and it appear that at least one character "
+                 "was encoded using n-bytes.",
+                 encoding_iana,
+             )
+ 
+         max_chunk_gave_up: int = int(len(r_) / 4)
+ 
+         max_chunk_gave_up = max(max_chunk_gave_up, 2)
+         early_stop_count: int = 0
+         lazy_str_hard_failure = False
+ 
+         md_chunks: list[str] = []
+         md_ratios = []
+ 
+         try:
+             for chunk in cut_sequence_chunks(
+                 sequences,
+                 encoding_iana,
+                 r_,
+                 chunk_size,
+                 bom_or_sig_available,
+                 strip_sig_or_bom,
+                 sig_payload,
+                 is_multi_byte_decoder,
+                 decoded_payload,
+             ):
+                 md_chunks.append(chunk)
+ 
+                 md_ratios.append(
+                     mess_ratio(
+                         chunk,
+                         threshold,
+                         explain is True and 1 <= len(cp_isolation) <= 2,
+                     )
+                 )
+ 
+                 if md_ratios[-1] >= threshold:
+                     early_stop_count += 1
+ 
+                 if (early_stop_count >= max_chunk_gave_up) or (
+                     bom_or_sig_available and strip_sig_or_bom is False
+                 ):
+                     break
+         except (
+             UnicodeDecodeError
+         ) as e:  # Lazy str loading may have missed something there
+             logger.log(
+                 TRACE,
+                 "LazyStr Loading: After MD chunk decode, code page %s does not fit given bytes sequence at ALL. %s",
+                 encoding_iana,
+                 str(e),
+             )
+             early_stop_count = max_chunk_gave_up
+             lazy_str_hard_failure = True
+ 
+         # We might want to check the sequence again with the whole content
+         # Only if initial MD tests passes
+         if (
+             not lazy_str_hard_failure
+             and is_too_large_sequence
+             and not is_multi_byte_decoder
+         ):
+             try:
+                 sequences[int(50e3) :].decode(encoding_iana, errors="strict")
+             except UnicodeDecodeError as e:
+                 logger.log(
+                     TRACE,
+                     "LazyStr Loading: After final lookup, code page %s does not fit given bytes sequence at ALL. %s",
+                     encoding_iana,
+                     str(e),
+                 )
+                 tested_but_hard_failure.append(encoding_iana)
+                 continue
+ 
+         mean_mess_ratio: float = sum(md_ratios) / len(md_ratios) if md_ratios else 0.0
+         if mean_mess_ratio >= threshold or early_stop_count >= max_chunk_gave_up:
+             tested_but_soft_failure.append(encoding_iana)
+             logger.log(
+                 TRACE,
+                 "%s was excluded because of initial chaos probing. Gave up %i time(s). "
+                 "Computed mean chaos is %f %%.",
+                 encoding_iana,
+                 early_stop_count,
+                 round(mean_mess_ratio * 100, ndigits=3),
+             )
+             # Preparing those fallbacks in case we got nothing.
+             if (
+                 enable_fallback
+                 and encoding_iana
+                 in ["ascii", "utf_8", specified_encoding, "utf_16", "utf_32"]
+                 and not lazy_str_hard_failure
+             ):
+                 fallback_entry = CharsetMatch(
+                     sequences,
+                     encoding_iana,
+                     threshold,
+                     bom_or_sig_available,
+                     [],
+                     decoded_payload,
+                     preemptive_declaration=specified_encoding,
+                 )
+                 if encoding_iana == specified_encoding:
+                     fallback_specified = fallback_entry
+                 elif encoding_iana == "ascii":
+                     fallback_ascii = fallback_entry
+                 else:
+                     fallback_u8 = fallback_entry
+             continue
+ 
+         logger.log(
+             TRACE,
+             "%s passed initial chaos probing. Mean measured chaos is %f %%",
+             encoding_iana,
+             round(mean_mess_ratio * 100, ndigits=3),
+         )
+ 
+         if not is_multi_byte_decoder:
+             target_languages: list[str] = encoding_languages(encoding_iana)
+         else:
+             target_languages = mb_encoding_languages(encoding_iana)
+ 
+         if target_languages:
+             logger.log(
+                 TRACE,
+                 "{} should target any language(s) of {}".format(
+                     encoding_iana, str(target_languages)
+                 ),
+             )
+ 
+         cd_ratios = []
+ 
+         # We shall skip the CD when its about ASCII
+         # Most of the time its not relevant to run "language-detection" on it.
+         if encoding_iana != "ascii":
+             for chunk in md_chunks:
+                 chunk_languages = coherence_ratio(
+                     chunk,
+                     language_threshold,
+                     ",".join(target_languages) if target_languages else None,
+                 )
+ 
+                 cd_ratios.append(chunk_languages)
+ 
+         cd_ratios_merged = merge_coherence_ratios(cd_ratios)
+ 
+         if cd_ratios_merged:
+             logger.log(
+                 TRACE,
+                 "We detected language {} using {}".format(
+                     cd_ratios_merged, encoding_iana
+                 ),
+             )
+ 
+         current_match = CharsetMatch(
+             sequences,
+             encoding_iana,
+             mean_mess_ratio,
+             bom_or_sig_available,
+             cd_ratios_merged,
+             (
+                 decoded_payload
+                 if (
+                     is_too_large_sequence is False
+                     or encoding_iana in [specified_encoding, "ascii", "utf_8"]
+                 )
+                 else None
+             ),
+             preemptive_declaration=specified_encoding,
+         )
+ 
+         results.append(current_match)
+ 
+         if (
+             encoding_iana in [specified_encoding, "ascii", "utf_8"]
+             and mean_mess_ratio < 0.1
+         ):
+             # If md says nothing to worry about, then... stop immediately!
+             if mean_mess_ratio == 0.0:
+                 logger.debug(
+                     "Encoding detection: %s is most likely the one.",
+                     current_match.encoding,
+                 )
+                 if explain:  # Defensive: ensure exit path clean handler
+                     logger.removeHandler(explain_handler)
+                     logger.setLevel(previous_logger_level)
+                 return CharsetMatches([current_match])
+ 
+             early_stop_results.append(current_match)
+ 
+         if (
+             len(early_stop_results)
+             and (specified_encoding is None or specified_encoding in tested)
+             and "ascii" in tested
+             and "utf_8" in tested
+         ):
+             probable_result: CharsetMatch = early_stop_results.best()  # type: ignore[assignment]
+             logger.debug(
+                 "Encoding detection: %s is most likely the one.",
+                 probable_result.encoding,
+             )
+             if explain:  # Defensive: ensure exit path clean handler
+                 logger.removeHandler(explain_handler)
+                 logger.setLevel(previous_logger_level)
+ 
+             return CharsetMatches([probable_result])
+ 
+         if encoding_iana == sig_encoding:
+             logger.debug(
+                 "Encoding detection: %s is most likely the one as we detected a BOM or SIG within "
+                 "the beginning of the sequence.",
+                 encoding_iana,
+             )
+             if explain:  # Defensive: ensure exit path clean handler
+                 logger.removeHandler(explain_handler)
+                 logger.setLevel(previous_logger_level)
+             return CharsetMatches([results[encoding_iana]])
+ 
+     if len(results) == 0:
+         if fallback_u8 or fallback_ascii or fallback_specified:
+             logger.log(
+                 TRACE,
+                 "Nothing got out of the detection process. Using ASCII/UTF-8/Specified fallback.",
+             )
+ 
+         if fallback_specified:
+             logger.debug(
+                 "Encoding detection: %s will be used as a fallback match",
+                 fallback_specified.encoding,
+             )
+             results.append(fallback_specified)
+         elif (
+             (fallback_u8 and fallback_ascii is None)
+             or (
+                 fallback_u8
+                 and fallback_ascii
+                 and fallback_u8.fingerprint != fallback_ascii.fingerprint
+             )
+             or (fallback_u8 is not None)
+         ):
+             logger.debug("Encoding detection: utf_8 will be used as a fallback match")
+             results.append(fallback_u8)
+         elif fallback_ascii:
+             logger.debug("Encoding detection: ascii will be used as a fallback match")
+             results.append(fallback_ascii)
+ 
+     if results:
+         logger.debug(
+             "Encoding detection: Found %s as plausible (best-candidate) for content. With %i alternatives.",
+             results.best().encoding,  # type: ignore
+             len(results) - 1,
+         )
+     else:
+         logger.debug("Encoding detection: Unable to determine any suitable charset.")
+ 
+     if explain:
+         logger.removeHandler(explain_handler)
+         logger.setLevel(previous_logger_level)
+ 
+     return results
+ 
+ 
+ def from_fp(
+     fp: BinaryIO,
+     steps: int = 5,
+     chunk_size: int = 512,
+     threshold: float = 0.20,
+     cp_isolation: list[str] | None = None,
+     cp_exclusion: list[str] | None = None,
+     preemptive_behaviour: bool = True,
+     explain: bool = False,
+     language_threshold: float = 0.1,
+     enable_fallback: bool = True,
+ ) -> CharsetMatches:
+     """
+     Same thing than the function from_bytes but using a file pointer that is already ready.
+     Will not close the file pointer.
+     """
+     return from_bytes(
+         fp.read(),
+         steps,
+         chunk_size,
+         threshold,
+         cp_isolation,
+         cp_exclusion,
+         preemptive_behaviour,
+         explain,
+         language_threshold,
+         enable_fallback,
+     )
+ 
+ 
+ def from_path(
+     path: str | bytes | PathLike,  # type: ignore[type-arg]
+     steps: int = 5,
+     chunk_size: int = 512,
+     threshold: float = 0.20,
+     cp_isolation: list[str] | None = None,
+     cp_exclusion: list[str] | None = None,
+     preemptive_behaviour: bool = True,
+     explain: bool = False,
+     language_threshold: float = 0.1,
+     enable_fallback: bool = True,
+ ) -> CharsetMatches:
+     """
+     Same thing than the function from_bytes but with one extra step. Opening and reading given file path in binary mode.
+     Can raise IOError.
+     """
+     with open(path, "rb") as fp:
+         return from_fp(
+             fp,
+             steps,
+             chunk_size,
+             threshold,
+             cp_isolation,
+             cp_exclusion,
+             preemptive_behaviour,
+             explain,
+             language_threshold,
+             enable_fallback,
+         )
+ 
+ 
+ def is_binary(
+     fp_or_path_or_payload: PathLike | str | BinaryIO | bytes,  # type: ignore[type-arg]
+     steps: int = 5,
+     chunk_size: int = 512,
+     threshold: float = 0.20,
+     cp_isolation: list[str] | None = None,
+     cp_exclusion: list[str] | None = None,
+     preemptive_behaviour: bool = True,
+     explain: bool = False,
+     language_threshold: float = 0.1,
+     enable_fallback: bool = False,
+ ) -> bool:
+     """
+     Detect if the given input (file, bytes, or path) points to a binary file. aka. not a string.
+     Based on the same main heuristic algorithms and default kwargs at the sole exception that fallbacks match
+     are disabled to be stricter around ASCII-compatible but unlikely to be a string.
+     """
+     if isinstance(fp_or_path_or_payload, (str, PathLike)):
+         guesses = from_path(
+             fp_or_path_or_payload,
+             steps=steps,
+             chunk_size=chunk_size,
+             threshold=threshold,
+             cp_isolation=cp_isolation,
+             cp_exclusion=cp_exclusion,
+             preemptive_behaviour=preemptive_behaviour,
+             explain=explain,
+             language_threshold=language_threshold,
+             enable_fallback=enable_fallback,
+         )
+     elif isinstance(
+         fp_or_path_or_payload,
+         (
+             bytes,
+             bytearray,
+         ),
+     ):
+         guesses = from_bytes(
+             fp_or_path_or_payload,
+             steps=steps,
+             chunk_size=chunk_size,
+             threshold=threshold,
+             cp_isolation=cp_isolation,
+             cp_exclusion=cp_exclusion,
+             preemptive_behaviour=preemptive_behaviour,
+             explain=explain,
+             language_threshold=language_threshold,
+             enable_fallback=enable_fallback,
+         )
+     else:
+         guesses = from_fp(
+             fp_or_path_or_payload,
+             steps=steps,
+             chunk_size=chunk_size,
+             threshold=threshold,
+             cp_isolation=cp_isolation,
+             cp_exclusion=cp_exclusion,
+             preemptive_behaviour=preemptive_behaviour,
+             explain=explain,
+             language_threshold=language_threshold,
+             enable_fallback=enable_fallback,
+         )
+ 
+     return not guesses
phivenv/Lib/site-packages/isympy.py ADDED
@@ -0,0 +1,342 @@
+ """
+ Python shell for SymPy.
+ 
+ This is just a normal Python shell (IPython shell if you have the
+ IPython package installed), that executes the following commands for
+ the user:
+ 
+ >>> from __future__ import division
+ >>> from sympy import *
+ >>> x, y, z, t = symbols('x y z t')
+ >>> k, m, n = symbols('k m n', integer=True)
+ >>> f, g, h = symbols('f g h', cls=Function)
+ >>> init_printing()
+ 
+ So starting 'isympy' is equivalent to starting Python (or IPython) and
+ executing the above commands by hand. It is intended for easy and quick
+ experimentation with SymPy. isympy is a good way to use SymPy as an
+ interactive calculator. If you have IPython and Matplotlib installed, then
+ interactive plotting is enabled by default.
+ 
+ COMMAND LINE OPTIONS
+ --------------------
+ 
+ -c CONSOLE, --console=CONSOLE
+ 
+     Use the specified shell (Python or IPython) shell as the console
+     backend instead of the default one (IPython if present, Python
+     otherwise), e.g.:
+ 
+         $isympy -c python
+ 
+     CONSOLE must be one of 'ipython' or 'python'
+ 
+ -p PRETTY, --pretty PRETTY
+ 
+     Setup pretty-printing in SymPy. When pretty-printing is enabled,
+     expressions can be printed with Unicode or ASCII. The default is
+     to use pretty-printing (with Unicode if the terminal supports it).
+     When this option is 'no', expressions will not be pretty-printed
+     and ASCII will be used:
+ 
+         $isympy -p no
+ 
+     PRETTY must be one of 'unicode', 'ascii', or 'no'
+ 
+ -t TYPES, --types=TYPES
+ 
+     Setup the ground types for the polys. By default, gmpy ground types
+     are used if gmpy2 or gmpy is installed, otherwise it falls back to python
+     ground types, which are a little bit slower. You can manually
+     choose python ground types even if gmpy is installed (e.g., for
+     testing purposes):
+ 
+         $isympy -t python
+ 
+     TYPES must be one of 'gmpy', 'gmpy1' or 'python'
+ 
+     Note that the ground type gmpy1 is primarily intended for testing; it
+     forces the use of gmpy version 1 even if gmpy2 is available.
+ 
+     This is the same as setting the environment variable
+     SYMPY_GROUND_TYPES to the given ground type (e.g.,
+     SYMPY_GROUND_TYPES='gmpy')
+ 
+     The ground types can be determined interactively from the variable
+     sympy.polys.domains.GROUND_TYPES.
+ 
+ -o ORDER, --order ORDER
+ 
+     Setup the ordering of terms for printing. The default is lex, which
+     orders terms lexicographically (e.g., x**2 + x + 1). You can choose
+     other orderings, such as rev-lex, which will use reverse
+     lexicographic ordering (e.g., 1 + x + x**2):
+ 
+         $isympy -o rev-lex
+ 
+     ORDER must be one of 'lex', 'rev-lex', 'grlex', 'rev-grlex',
+     'grevlex', 'rev-grevlex', 'old', or 'none'.
+ 
+     Note that for very large expressions, ORDER='none' may speed up
+     printing considerably but the terms will have no canonical order.
+ 
+ -q, --quiet
+ 
+     Print only Python's and SymPy's versions to stdout at startup.
+ 
+ -d, --doctest
+ 
+     Use the same format that should be used for doctests. This is
+     equivalent to -c python -p no.
+ 
+ -C, --no-cache
+ 
+     Disable the caching mechanism. Disabling the cache may slow certain
+     operations down considerably. This is useful for testing the cache,
+     or for benchmarking, as the cache can result in deceptive timings.
+ 
+     This is equivalent to setting the environment variable
+     SYMPY_USE_CACHE to 'no'.
+ 
+ -a, --auto-symbols (requires at least IPython 0.11)
+ 
+     Automatically create missing symbols. Normally, typing a name of a
+     Symbol that has not been instantiated first would raise NameError,
+     but with this option enabled, any undefined name will be
+     automatically created as a Symbol.
+ 
+     Note that this is intended only for interactive, calculator style
+     usage. In a script that uses SymPy, Symbols should be instantiated
+     at the top, so that it's clear what they are.
+ 
+     This will not override any names that are already defined, which
+     includes the single character letters represented by the mnemonic
+     QCOSINE (see the "Gotchas and Pitfalls" document in the
+     documentation). You can delete existing names by executing "del
+     name". If a name is defined, typing "'name' in dir()" will return True.
+ 
+     The Symbols that are created using this have default assumptions.
+     If you want to place assumptions on symbols, you should create them
+     using symbols() or var().
+ 
+     Finally, this only works in the top level namespace. So, for
+     example, if you define a function in isympy with an undefined
+     Symbol, it will not work.
+ 
+     See also the -i and -I options.
+ 
+ -i, --int-to-Integer (requires at least IPython 0.11)
+ 
+     Automatically wrap int literals with Integer. This makes it so that
+     things like 1/2 will come out as Rational(1, 2), rather than 0.5. This
+     works by preprocessing the source and wrapping all int literals with
+     Integer. Note that this will not change the behavior of int literals
+     assigned to variables, and it also won't change the behavior of functions
+     that return int literals.
+ 
+     If you want an int, you can wrap the literal in int(), e.g. int(3)/int(2)
+     gives 1.5 (with division imported from __future__).
+ 
+ -I, --interactive (requires at least IPython 0.11)
+ 
+     This is equivalent to --auto-symbols --int-to-Integer. Future options
+     designed for ease of interactive use may be added to this.
+ 
+ -D, --debug
+ 
+     Enable debugging output. This is the same as setting the
+     environment variable SYMPY_DEBUG to 'True'. The debug status is set
+     in the variable SYMPY_DEBUG within isympy.
+ 
+ -- IPython options
+ 
+     Additionally you can pass command line options directly to the IPython
+     interpreter (the standard Python shell is not supported). However you
+     need to add the '--' separator between two types of options, e.g the
+     startup banner option and the colors option. You need to enter the
+     options as required by the version of IPython that you are using, too:
+ 
+     in IPython 0.11,
+ 
+         $isympy -q -- --colors=NoColor
+ 
+     or older versions of IPython,
+ 
+         $isympy -q -- -colors NoColor
+ 
+ See also isympy --help.
+ """
+ 
+ import os
+ import sys
+ 
+ # DO NOT IMPORT SYMPY HERE! Or the setting of the sympy environment variables
+ # by the command line will break.
+ 
+ def main() -> None:
+     from argparse import ArgumentParser, RawDescriptionHelpFormatter
+ 
+     VERSION = None
+     if '--version' in sys.argv:
+         # We cannot import sympy before this is run, because flags like -C and
+         # -t set environment variables that must be set before SymPy is
+         # imported. The only thing we need to import it for is to get the
+         # version, which only matters with the --version flag.
+         import sympy
+         VERSION = sympy.__version__
+ 
+     usage = 'isympy [options] -- [ipython options]'
+     parser = ArgumentParser(
+         usage=usage,
+         description=__doc__,
+         formatter_class=RawDescriptionHelpFormatter,
+     )
+ 
+     parser.add_argument('--version', action='version', version=VERSION)
+ 
+     parser.add_argument(
+         '-c', '--console',
+         dest='console',
+         action='store',
+         default=None,
+         choices=['ipython', 'python'],
+         metavar='CONSOLE',
+         help='select type of interactive session: ipython | python; defaults '
+         'to ipython if IPython is installed, otherwise python')
+ 
+     parser.add_argument(
+         '-p', '--pretty',
+         dest='pretty',
+         action='store',
+         default=None,
+         metavar='PRETTY',
+         choices=['unicode', 'ascii', 'no'],
+         help='setup pretty printing: unicode | ascii | no; defaults to '
+         'unicode printing if the terminal supports it, otherwise ascii')
+ 
+     parser.add_argument(
+         '-t', '--types',
+         dest='types',
+         action='store',
+         default=None,
+         metavar='TYPES',
+         choices=['gmpy', 'gmpy1', 'python'],
+         help='setup ground types: gmpy | gmpy1 | python; defaults to gmpy if gmpy2 '
+         'or gmpy is installed, otherwise python')
+ 
+     parser.add_argument(
+         '-o', '--order',
+         dest='order',
+         action='store',
+         default=None,
+         metavar='ORDER',
+         choices=['lex', 'grlex', 'grevlex', 'rev-lex', 'rev-grlex', 'rev-grevlex', 'old', 'none'],
+         help='setup ordering of terms: [rev-]lex | [rev-]grlex | [rev-]grevlex | old | none; defaults to lex')
+ 
+     parser.add_argument(
+         '-q', '--quiet',
+         dest='quiet',
+         action='store_true',
+         default=False,
+         help='print only version information at startup')
+ 
+     parser.add_argument(
+         '-d', '--doctest',
+         dest='doctest',
+         action='store_true',
+         default=False,
+         help='use the doctest format for output (you can just copy and paste it)')
+ 
+     parser.add_argument(
+         '-C', '--no-cache',
+         dest='cache',
+         action='store_false',
+         default=True,
+         help='disable caching mechanism')
+ 
+     parser.add_argument(
+         '-a', '--auto-symbols',
+         dest='auto_symbols',
+         action='store_true',
+         default=False,
+         help='automatically construct missing symbols')
+ 
+     parser.add_argument(
+         '-i', '--int-to-Integer',
+         dest='auto_int_to_Integer',
+         action='store_true',
+         default=False,
+         help="automatically wrap int literals with Integer")
+ 
+     parser.add_argument(
+         '-I', '--interactive',
+         dest='interactive',
+         action='store_true',
+         default=False,
+         help="equivalent to -a -i")
+ 
+     parser.add_argument(
+         '-D', '--debug',
+         dest='debug',
+         action='store_true',
+         default=False,
+         help='enable debugging output')
+ 
+     (options, ipy_args) = parser.parse_known_args()
+     if '--' in ipy_args:
+         ipy_args.remove('--')
+ 
+     if not options.cache:
+         os.environ['SYMPY_USE_CACHE'] = 'no'
+ 
+     if options.types:
+         os.environ['SYMPY_GROUND_TYPES'] = options.types
+ 
+     if options.debug:
+         os.environ['SYMPY_DEBUG'] = str(options.debug)
+ 
+     if options.doctest:
+         options.pretty = 'no'
+         options.console = 'python'
+ 
+     session = options.console
+ 
+     if session is not None:
+         ipython = session == 'ipython'
+     else:
+         try:
+             import IPython  # noqa: F401
+             ipython = True
+         except ImportError:
+             if not options.quiet:
+                 from sympy.interactive.session import no_ipython
+                 print(no_ipython)
+             ipython = False
+ 
+     args = {
+         'pretty_print': True,
+         'use_unicode': None,
+         'use_latex': None,
+         'order': None,
+         'argv': ipy_args,
+     }
+ 
+     if options.pretty == 'unicode':
+         args['use_unicode'] = True
+     elif options.pretty == 'ascii':
+         args['use_unicode'] = False
+     elif options.pretty == 'no':
+         args['pretty_print'] = False
+ 
+     if options.order is not None:
+         args['order'] = options.order
+ 
+     args['quiet'] = options.quiet
+     args['auto_symbols'] = options.auto_symbols or options.interactive
+     args['auto_int_to_Integer'] = options.auto_int_to_Integer or options.interactive
+ 
+     from sympy.interactive import init_session
+     init_session(ipython, **args)
+ 
+ if __name__ == "__main__":
+     main()
phivenv/Lib/site-packages/numpy-2.0.2-cp39-cp39-win_amd64.whl ADDED
File without changes
phivenv/Lib/site-packages/typing_extensions.py ADDED
The diff for this file is too large to render.
phivenv/pyvenv.cfg ADDED
@@ -0,0 +1,3 @@
+ home = C:\Users\aravi\AppData\Local\Programs\Python\Python39
+ include-system-site-packages = false
+ version = 3.9.13
requirements.txt ADDED
File without changes
testing_merged_model.py ADDED
@@ -0,0 +1,74 @@
+ import traceback
+ 
+ import torch
+ from transformers import AutoModelForCausalLM, AutoTokenizer
+ 
+ MERGED_MODEL_PATH = "./merged_tinyllama_logger"
+ 
+ SAMPLE_LOG = """2023-03-06 15:38:41 ERROR [Worker-11] org.hibernate.exception.ConstraintViolationException at at com.example.CacheManager.land(CacheManager.java:359) at at com.example.ShippingService.discover(CacheManager.java:436) at at com.example.HttpClient.work(DatabaseConnector.java:494) at at com.example.ShippingService.window(OrderModule.java:378) at at com.example.CacheManager.almost(DatabaseConnector.java:326) at at com.example.DatabaseConnector.couple(AuthModule.java:13) at at com.example.PaymentModule.wrong(HttpClient.java:244)."""
+ 
+ # Initialize to None so the post-load check below works even if loading raises.
+ model = None
+ tokenizer = None
+ 
+ try:
+     model = AutoModelForCausalLM.from_pretrained(
+         MERGED_MODEL_PATH,
+         low_cpu_mem_usage=True,
+         return_dict=True,
+         torch_dtype=torch.float16,
+         device_map="auto",
+     )
+     print("AutoModelForCausalLM loaded successfully.")
+     print("Loading AutoTokenizer...")
+     tokenizer = AutoTokenizer.from_pretrained(MERGED_MODEL_PATH)
+     print("AutoTokenizer loaded successfully.")
+ except Exception:
+     print("ERROR LOADING MODEL OR TOKENIZER...CHECK PATH")
+     traceback.print_exc()
+ 
+ if model is None or tokenizer is None:
+     print("error loading model or tokenizer")
+     exit(1)
+ 
+ if tokenizer.pad_token is None:
+     tokenizer.pad_token = tokenizer.eos_token
+     tokenizer.padding_side = "left"
+ 
+ prompt = SAMPLE_LOG + "\n"
+ 
+ inputs = tokenizer(prompt, return_tensors="pt", return_attention_mask=True).to(model.device)
+ 
+ with torch.no_grad():
+     output_tokens = model.generate(
+         **inputs,
+         max_new_tokens=60,
+         temperature=0.3,
+         do_sample=True,
+         top_p=0.9,
+         top_k=30,
+         eos_token_id=tokenizer.eos_token_id,
+         pad_token_id=tokenizer.pad_token_id,
+         num_return_sequences=1,
+     )
+ 
+ generated_text = tokenizer.decode(output_tokens[0], skip_special_tokens=True)
+ print(f"Generated Text: {generated_text}")
+ print("END OF GENERATED TEXT")
+ 
+ # The fine-tuned model's summaries are expected to end with a timestamp
+ # suffix ("AM"/"PM"); take everything between the prompt and that marker.
+ summary_start_index = len(SAMPLE_LOG) + 1
+ summary = ""
+ summary_end_index = -1  # stays -1 when no AM/PM marker is found
+ 
+ if "PM" in generated_text:
+     summary_end_index = generated_text.rfind("PM") + len("PM")
+ elif "AM" in generated_text:
+     summary_end_index = generated_text.rfind("AM") + len("AM")
+ 
+ if summary_end_index != -1 and summary_end_index > summary_start_index:
+     summary = generated_text[summary_start_index:summary_end_index].strip()
+ else:
+     # Fall back to stripping the prompt off the front of the decoded output.
+     prompt_end_index = generated_text.find(SAMPLE_LOG + "\n")
+     if prompt_end_index != -1:
+         summary = generated_text[prompt_end_index + len(SAMPLE_LOG + "\n"):].strip()
+     else:
+         summary = generated_text.strip()
+ 
+ print(summary)
training_phi2.py ADDED
@@ -0,0 +1,107 @@
+ import os
+ 
+ import torch
+ from datasets import load_dataset
+ from peft import LoraConfig
+ from transformers import (
+     AutoModelForCausalLM,
+     AutoTokenizer,
+     BitsAndBytesConfig,
+     EarlyStoppingCallback,
+     TrainingArguments,
+ )
+ from trl import SFTTrainer
+ 
+ NAME_OF_MODEL = "./merged_tinyllama_logger"
+ DATASET_PATH = "/app/data/log_dataset.jsonl"
+ OUTPUT_DIR = "/app/model_output/incremental_1_logs"
+ 
+ os.makedirs(OUTPUT_DIR, exist_ok=True)
+ 
+ # Quantization configuration: load the base model in 4-bit NF4 with fp16 compute (QLoRA-style).
+ bnb_config = BitsAndBytesConfig(
+     load_in_4bit=True,
+     bnb_4bit_quant_type="nf4",
+     bnb_4bit_compute_dtype=torch.float16,
+     bnb_4bit_use_double_quant=True,
+ )
+ 
+ # LoRA adapter configuration; matches the adapter_config.json saved in this commit.
+ lora_config = LoraConfig(
+     r=32,
+     lora_alpha=124,
+     bias="none",
+     lora_dropout=0.15,
+     task_type="CAUSAL_LM",
+ )
+ 
+ training_args = TrainingArguments(
+     output_dir=OUTPUT_DIR,
+     per_device_train_batch_size=4,
+     gradient_accumulation_steps=16,
+     learning_rate=1e-4,
+     weight_decay=0.001,
+     bf16=False,
+     max_grad_norm=0.3,
+     max_steps=-1,
+     warmup_ratio=0.03,
+     group_by_length=True,
+     lr_scheduler_type="cosine",
+     num_train_epochs=4,
+     logging_steps=10,
+     save_steps=25,
+     fp16=True,
+     optim="paged_adamw_8bit",
+     report_to=["tensorboard"],
+     eval_strategy="steps",
+     eval_steps=25,
+     load_best_model_at_end=True,
+     metric_for_best_model="eval_loss",
+     greater_is_better=False,
+ )
+ 
+ try:
+     dataset = load_dataset("json", data_files=DATASET_PATH)
+     # Hold out 10% of the examples for evaluation.
+     split_dataset = dataset["train"].train_test_split(test_size=0.1, seed=42)
+     train_dataset = split_dataset["train"]
+     eval_dataset = split_dataset["test"]
+ except Exception as e:
+     print(f"error loading dataset from {DATASET_PATH}: {e}")
+     exit(1)
+ 
+ print("Loading model with quantization")
+ 
+ try:
+     model = AutoModelForCausalLM.from_pretrained(
+         NAME_OF_MODEL,
+         quantization_config=bnb_config,
+         device_map="auto",
+         trust_remote_code=True,
+         torch_dtype=torch.float16,
+     )
+     model.config.pretraining_tp = 1  # disable tensor-parallel pretraining paths during fine-tuning
+     print("Model loaded successfully")
+ except Exception as e:
+     print(f"ERROR LOADING MODEL: {e}")
+     exit(1)
+ 
+ try:
+     tokenizer = AutoTokenizer.from_pretrained(NAME_OF_MODEL, trust_remote_code=True)
+     tokenizer.pad_token = tokenizer.eos_token
+     tokenizer.padding_side = "right"
+ except Exception as e:
+     print(f"ERROR LOADING TOKENIZER: {e}")
+     exit(1)
+ 
+ trainer = SFTTrainer(
+     model=model,
+     train_dataset=train_dataset,
+     eval_dataset=eval_dataset,
+     peft_config=lora_config,
+     dataset_text_field="text",
+     max_seq_length=512,
+     tokenizer=tokenizer,
+     args=training_args,
+     packing=False,
+     callbacks=[EarlyStoppingCallback(early_stopping_patience=7)],
+ )
+ 
+ print("training started")
+ trainer.train()
+ print("fine tuning complete")
+ 
+ trainer.save_model(OUTPUT_DIR)
+ 
upload_to_hub.py ADDED
@@ -0,0 +1,26 @@
+ from huggingface_hub import HfApi
+ 
+ # Your repository name on Hugging Face
+ repo_id = "cranky-coder08/Phi2-Fine-Tuning"
+ 
+ # The local folder to upload (the current directory, represented by ".")
+ local_folder_path = "."
+ 
+ # Your Hugging Face access token with "write" permissions
+ # Replace with your actual token or leave it blank if you are already logged in
+ # token = "hf_..."
+ 
+ # Initialize the Hugging Face API client
+ api = HfApi()
+ 
+ # Upload the entire folder
+ print(f"Uploading folder '{local_folder_path}' to '{repo_id}'...")
+ api.upload_large_folder(
+     folder_path=local_folder_path,
+     repo_id=repo_id,
+     repo_type="model",
+     # Optional: set a commit message
+     # commit_message="Initial upload of fine-tuned Phi2 model."
+ )
+ 
+ print("Upload complete!")