PrajnaShetty committed on
Commit
3d4c4c2
·
verified ·
1 Parent(s): 77cb6bd

Add arabert-lora v1 logged-model subtree (pyfunc bundle)

Browse files
Files changed (18) hide show
  1. mlruns/1/models/m-f9cac40424504a5a91d9449f38f5bd7c/artifacts/MLmodel +39 -0
  2. mlruns/1/models/m-f9cac40424504a5a91d9449f38f5bd7c/artifacts/artifacts/arabert-lora-v1/README.md +206 -0
  3. mlruns/1/models/m-f9cac40424504a5a91d9449f38f5bd7c/artifacts/artifacts/arabert-lora-v1/adapter_config.json +46 -0
  4. mlruns/1/models/m-f9cac40424504a5a91d9449f38f5bd7c/artifacts/artifacts/arabert-lora-v1/adapter_model.safetensors +3 -0
  5. mlruns/1/models/m-f9cac40424504a5a91d9449f38f5bd7c/artifacts/artifacts/arabert-lora-v1/labels.json +1 -0
  6. mlruns/1/models/m-f9cac40424504a5a91d9449f38f5bd7c/artifacts/artifacts/arabert-lora-v1/pyfunc_meta.json +1 -0
  7. mlruns/1/models/m-f9cac40424504a5a91d9449f38f5bd7c/artifacts/artifacts/arabert-lora-v1/tokenizer.json +0 -0
  8. mlruns/1/models/m-f9cac40424504a5a91d9449f38f5bd7c/artifacts/artifacts/arabert-lora-v1/tokenizer_config.json +50 -0
  9. mlruns/1/models/m-f9cac40424504a5a91d9449f38f5bd7c/artifacts/artifacts/pyfunc_meta.json +1 -0
  10. mlruns/1/models/m-f9cac40424504a5a91d9449f38f5bd7c/artifacts/conda.yaml +30 -0
  11. mlruns/1/models/m-f9cac40424504a5a91d9449f38f5bd7c/artifacts/input_example.json +1 -0
  12. mlruns/1/models/m-f9cac40424504a5a91d9449f38f5bd7c/artifacts/pyproject.toml +46 -0
  13. mlruns/1/models/m-f9cac40424504a5a91d9449f38f5bd7c/artifacts/python_env.yaml +7 -0
  14. mlruns/1/models/m-f9cac40424504a5a91d9449f38f5bd7c/artifacts/python_model.pkl +3 -0
  15. mlruns/1/models/m-f9cac40424504a5a91d9449f38f5bd7c/artifacts/registered_model_meta +2 -0
  16. mlruns/1/models/m-f9cac40424504a5a91d9449f38f5bd7c/artifacts/requirements.txt +22 -0
  17. mlruns/1/models/m-f9cac40424504a5a91d9449f38f5bd7c/artifacts/serving_input_example.json +12 -0
  18. mlruns/1/models/m-f9cac40424504a5a91d9449f38f5bd7c/artifacts/uv.lock +0 -0
mlruns/1/models/m-f9cac40424504a5a91d9449f38f5bd7c/artifacts/MLmodel ADDED
@@ -0,0 +1,39 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ artifact_path: /Users/prajnashetty/Workspace/Arabic Sentiment Analysis/app/mlruns/1/models/m-f9cac40424504a5a91d9449f38f5bd7c/artifacts
2
+ flavors:
3
+ python_function:
4
+ artifacts:
5
+ backend_type:
6
+ path: artifacts/pyfunc_meta.json
7
+ uri: models/arabert-lora-v1/pyfunc_meta.json
8
+ model_dir:
9
+ path: artifacts/arabert-lora-v1
10
+ uri: models/arabert-lora-v1
11
+ cloudpickle_version: 3.1.2
12
+ code: null
13
+ env:
14
+ conda: conda.yaml
15
+ virtualenv: python_env.yaml
16
+ loader_module: mlflow.pyfunc.model
17
+ python_model: python_model.pkl
18
+ python_version: 3.12.8
19
+ streamable: false
20
+ is_signature_from_type_hint: false
21
+ mlflow_version: 3.12.0
22
+ model_id: m-f9cac40424504a5a91d9449f38f5bd7c
23
+ model_size_bytes: 547201599
24
+ model_uuid: m-f9cac40424504a5a91d9449f38f5bd7c
25
+ prompts: null
26
+ run_id: 94cccbd929a845dd9e47d46a5c3db759
27
+ saved_input_example_info:
28
+ artifact_path: input_example.json
29
+ pandas_orient: split
30
+ serving_input_path: serving_input_example.json
31
+ type: dataframe
32
+ signature:
33
+ inputs: '[{"type": "string", "name": "text", "required": true}]'
34
+ outputs: '[{"type": "string", "name": "text", "required": true}, {"type": "string",
35
+ "name": "sentiment", "required": true}, {"type": "double", "name": "confidence",
36
+ "required": true}]'
37
+ params: null
38
+ type_hint_from_example: false
39
+ utc_time_created: '2026-05-22 18:09:03.492031'
mlruns/1/models/m-f9cac40424504a5a91d9449f38f5bd7c/artifacts/artifacts/arabert-lora-v1/README.md ADDED
@@ -0,0 +1,206 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ base_model: aubmindlab/bert-base-arabertv2
3
+ library_name: peft
4
+ tags:
5
+ - base_model:adapter:aubmindlab/bert-base-arabertv2
6
+ - lora
7
+ - transformers
8
+ ---
9
+
10
+ # Model Card for arabert-lora-v1
11
+
12
+ <!-- Provide a quick summary of what the model is/does. -->
13
+
14
+
15
+
16
+ ## Model Details
17
+
18
+ ### Model Description
19
+
20
+ <!-- Provide a longer summary of what this model is. -->
21
+
22
+
23
+
24
+ - **Developed by:** [More Information Needed]
25
+ - **Funded by [optional]:** [More Information Needed]
26
+ - **Shared by [optional]:** [More Information Needed]
27
+ - **Model type:** LoRA adapter (PEFT) for sequence classification — sentiment labels: positive, negative, neutral
28
+ - **Language(s) (NLP):** Arabic
29
+ - **License:** [More Information Needed]
30
+ - **Finetuned from model [optional]:** aubmindlab/bert-base-arabertv2
31
+
32
+ ### Model Sources [optional]
33
+
34
+ <!-- Provide the basic links for the model. -->
35
+
36
+ - **Repository:** [More Information Needed]
37
+ - **Paper [optional]:** [More Information Needed]
38
+ - **Demo [optional]:** [More Information Needed]
39
+
40
+ ## Uses
41
+
42
+ <!-- Address questions around how the model is intended to be used, including the foreseeable users of the model and those affected by the model. -->
43
+
44
+ ### Direct Use
45
+
46
+ <!-- This section is for the model use without fine-tuning or plugging into a larger ecosystem/app. -->
47
+
48
+ [More Information Needed]
49
+
50
+ ### Downstream Use [optional]
51
+
52
+ <!-- This section is for the model use when fine-tuned for a task, or when plugged into a larger ecosystem/app -->
53
+
54
+ [More Information Needed]
55
+
56
+ ### Out-of-Scope Use
57
+
58
+ <!-- This section addresses misuse, malicious use, and uses that the model will not work well for. -->
59
+
60
+ [More Information Needed]
61
+
62
+ ## Bias, Risks, and Limitations
63
+
64
+ <!-- This section is meant to convey both technical and sociotechnical limitations. -->
65
+
66
+ [More Information Needed]
67
+
68
+ ### Recommendations
69
+
70
+ <!-- This section is meant to convey recommendations with respect to the bias, risk, and technical limitations. -->
71
+
72
+ Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations.
73
+
74
+ ## How to Get Started with the Model
75
+
76
+ Use the code below to get started with the model.
77
+
78
+ [More Information Needed]
79
+
80
+ ## Training Details
81
+
82
+ ### Training Data
83
+
84
+ <!-- This should link to a Dataset Card, perhaps with a short stub of information on what the training data is all about as well as documentation related to data pre-processing or additional filtering. -->
85
+
86
+ [More Information Needed]
87
+
88
+ ### Training Procedure
89
+
90
+ <!-- This relates heavily to the Technical Specifications. Content here should link to that section when it is relevant to the training procedure. -->
91
+
92
+ #### Preprocessing [optional]
93
+
94
+ [More Information Needed]
95
+
96
+
97
+ #### Training Hyperparameters
98
+
99
+ - **Training regime:** [More Information Needed] <!--fp32, fp16 mixed precision, bf16 mixed precision, bf16 non-mixed precision, fp16 non-mixed precision, fp8 mixed precision -->
100
+
101
+ #### Speeds, Sizes, Times [optional]
102
+
103
+ <!-- This section provides information about throughput, start/end time, checkpoint size if relevant, etc. -->
104
+
105
+ [More Information Needed]
106
+
107
+ ## Evaluation
108
+
109
+ <!-- This section describes the evaluation protocols and provides the results. -->
110
+
111
+ ### Testing Data, Factors & Metrics
112
+
113
+ #### Testing Data
114
+
115
+ <!-- This should link to a Dataset Card if possible. -->
116
+
117
+ [More Information Needed]
118
+
119
+ #### Factors
120
+
121
+ <!-- These are the things the evaluation is disaggregating by, e.g., subpopulations or domains. -->
122
+
123
+ [More Information Needed]
124
+
125
+ #### Metrics
126
+
127
+ <!-- These are the evaluation metrics being used, ideally with a description of why. -->
128
+
129
+ [More Information Needed]
130
+
131
+ ### Results
132
+
133
+ [More Information Needed]
134
+
135
+ #### Summary
136
+
137
+
138
+
139
+ ## Model Examination [optional]
140
+
141
+ <!-- Relevant interpretability work for the model goes here -->
142
+
143
+ [More Information Needed]
144
+
145
+ ## Environmental Impact
146
+
147
+ <!-- Total emissions (in grams of CO2eq) and additional considerations, such as electricity usage, go here. Edit the suggested text below accordingly -->
148
+
149
+ Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700).
150
+
151
+ - **Hardware Type:** [More Information Needed]
152
+ - **Hours used:** [More Information Needed]
153
+ - **Cloud Provider:** [More Information Needed]
154
+ - **Compute Region:** [More Information Needed]
155
+ - **Carbon Emitted:** [More Information Needed]
156
+
157
+ ## Technical Specifications [optional]
158
+
159
+ ### Model Architecture and Objective
160
+
161
+ [More Information Needed]
162
+
163
+ ### Compute Infrastructure
164
+
165
+ [More Information Needed]
166
+
167
+ #### Hardware
168
+
169
+ [More Information Needed]
170
+
171
+ #### Software
172
+
173
+ [More Information Needed]
174
+
175
+ ## Citation [optional]
176
+
177
+ <!-- If there is a paper or blog post introducing the model, the APA and Bibtex information for that should go in this section. -->
178
+
179
+ **BibTeX:**
180
+
181
+ [More Information Needed]
182
+
183
+ **APA:**
184
+
185
+ [More Information Needed]
186
+
187
+ ## Glossary [optional]
188
+
189
+ <!-- If relevant, include terms and calculations in this section that can help readers understand the model or model card. -->
190
+
191
+ [More Information Needed]
192
+
193
+ ## More Information [optional]
194
+
195
+ [More Information Needed]
196
+
197
+ ## Model Card Authors [optional]
198
+
199
+ [More Information Needed]
200
+
201
+ ## Model Card Contact
202
+
203
+ [More Information Needed]
204
+ ### Framework versions
205
+
206
+ - PEFT 0.19.1
mlruns/1/models/m-f9cac40424504a5a91d9449f38f5bd7c/artifacts/artifacts/arabert-lora-v1/adapter_config.json ADDED
@@ -0,0 +1,46 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "alora_invocation_tokens": null,
3
+ "alpha_pattern": {},
4
+ "arrow_config": null,
5
+ "auto_mapping": null,
6
+ "base_model_name_or_path": "aubmindlab/bert-base-arabertv2",
7
+ "bias": "none",
8
+ "corda_config": null,
9
+ "ensure_weight_tying": false,
10
+ "eva_config": null,
11
+ "exclude_modules": null,
12
+ "fan_in_fan_out": false,
13
+ "inference_mode": true,
14
+ "init_lora_weights": true,
15
+ "layer_replication": null,
16
+ "layers_pattern": null,
17
+ "layers_to_transform": null,
18
+ "loftq_config": {},
19
+ "lora_alpha": 16,
20
+ "lora_bias": false,
21
+ "lora_dropout": 0.1,
22
+ "lora_ga_config": null,
23
+ "megatron_config": null,
24
+ "megatron_core": "megatron.core",
25
+ "modules_to_save": [
26
+ "classifier",
27
+ "score"
28
+ ],
29
+ "peft_type": "LORA",
30
+ "peft_version": "0.19.1",
31
+ "qalora_group_size": 16,
32
+ "r": 8,
33
+ "rank_pattern": {},
34
+ "revision": null,
35
+ "target_modules": [
36
+ "value",
37
+ "query"
38
+ ],
39
+ "target_parameters": null,
40
+ "task_type": "SEQ_CLS",
41
+ "trainable_token_indices": null,
42
+ "use_bdlora": null,
43
+ "use_dora": false,
44
+ "use_qalora": false,
45
+ "use_rslora": false
46
+ }
mlruns/1/models/m-f9cac40424504a5a91d9449f38f5bd7c/artifacts/artifacts/arabert-lora-v1/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ede973351e6bf26581ffbf3c00513ea563be855ed41e1c8165343b4fae91178
3
+ size 1195748
mlruns/1/models/m-f9cac40424504a5a91d9449f38f5bd7c/artifacts/artifacts/arabert-lora-v1/labels.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["positive", "negative", "neutral"]
mlruns/1/models/m-f9cac40424504a5a91d9449f38f5bd7c/artifacts/artifacts/arabert-lora-v1/pyfunc_meta.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"backend_type": "arabert-lora"}
mlruns/1/models/m-f9cac40424504a5a91d9449f38f5bd7c/artifacts/artifacts/arabert-lora-v1/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
mlruns/1/models/m-f9cac40424504a5a91d9449f38f5bd7c/artifacts/artifacts/arabert-lora-v1/tokenizer_config.json ADDED
@@ -0,0 +1,50 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "backend": "tokenizers",
3
+ "cls_token": "[CLS]",
4
+ "do_basic_tokenize": true,
5
+ "do_lower_case": false,
6
+ "is_local": false,
7
+ "local_files_only": false,
8
+ "mask_token": "[MASK]",
9
+ "max_len": 512,
10
+ "model_max_length": 512,
11
+ "never_split": [
12
+ "+ك",
13
+ "+كما",
14
+ "ك+",
15
+ "+وا",
16
+ "+ين",
17
+ "و+",
18
+ "+كن",
19
+ "+ان",
20
+ "+هم",
21
+ "+ة",
22
+ "[بريد]",
23
+ "لل+",
24
+ "+ي",
25
+ "+ت",
26
+ "+ن",
27
+ "س+",
28
+ "ل+",
29
+ "[مستخدم]",
30
+ "+كم",
31
+ "+ا",
32
+ "ب+",
33
+ "ف+",
34
+ "+نا",
35
+ "+ها",
36
+ "+ون",
37
+ "+هما",
38
+ "ال+",
39
+ "+ه",
40
+ "+هن",
41
+ "+ات",
42
+ "[رابط]"
43
+ ],
44
+ "pad_token": "[PAD]",
45
+ "sep_token": "[SEP]",
46
+ "strip_accents": null,
47
+ "tokenize_chinese_chars": true,
48
+ "tokenizer_class": "BertTokenizer",
49
+ "unk_token": "[UNK]"
50
+ }
mlruns/1/models/m-f9cac40424504a5a91d9449f38f5bd7c/artifacts/artifacts/pyfunc_meta.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"backend_type": "arabert-lora"}
mlruns/1/models/m-f9cac40424504a5a91d9449f38f5bd7c/artifacts/conda.yaml ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ channels:
2
+ - conda-forge
3
+ dependencies:
4
+ - python=3.12.8
5
+ - pip
6
+ - pip:
7
+ - mlflow==3.12.0
8
+ - annotated-doc==0.0.4
9
+ - annotated-types==0.7.0
10
+ - anyio==4.13.0
11
+ - click==8.4.0
12
+ - cloudpickle==3.1.2
13
+ - colorama==0.4.6; sys_platform == "win32"
14
+ - fastapi==0.136.1
15
+ - h11==0.16.0
16
+ - httptools==0.7.1
17
+ - idna==3.15
18
+ - pydantic-core==2.46.4
19
+ - pydantic==2.13.4
20
+ - python-dotenv==1.2.2
21
+ - pyyaml==6.0.3
22
+ - starlette==0.52.1
23
+ - typing-extensions==4.15.0
24
+ - typing-inspection==0.4.2
25
+ - uvicorn==0.47.0
26
+ - uvloop==0.22.1; platform_python_implementation != "PyPy" and sys_platform != "cygwin"
27
+ and sys_platform != "win32"
28
+ - watchfiles==1.2.0
29
+ - websockets==16.0
30
+ name: mlflow-env
mlruns/1/models/m-f9cac40424504a5a91d9449f38f5bd7c/artifacts/input_example.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"columns": ["text"], "data": [["\u0645\u0631\u062d\u0628\u0627"]]}
mlruns/1/models/m-f9cac40424504a5a91d9449f38f5bd7c/artifacts/pyproject.toml ADDED
@@ -0,0 +1,46 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [project]
2
+ name = "arabic-sentiment-mlops"
3
+ version = "0.1.0"
4
+ requires-python = ">=3.12"
5
+ dependencies = [
6
+ "fastapi>=0.115",
7
+ "uvicorn[standard]>=0.30",
8
+ "pydantic>=2.7",
9
+ ]
10
+
11
+ [project.optional-dependencies]
12
+ ml = [
13
+ "transformers>=4.40",
14
+ "catboost>=1.2",
15
+ "scikit-learn>=1.5",
16
+ "mlflow>=2.14",
17
+ "torch>=2.3",
18
+ "datasets>=2.18",
19
+ "peft>=0.11",
20
+ "accelerate>=0.30",
21
+ "evaluate>=0.4",
22
+ ]
23
+ dev = [
24
+ "pytest>=8.2",
25
+ "pytest-cov>=5.0",
26
+ "httpx>=0.27",
27
+ "ruff>=0.4",
28
+ ]
29
+
30
+ [build-system]
31
+ requires = ["hatchling"]
32
+ build-backend = "hatchling.build"
33
+
34
+ [tool.hatch.build.targets.wheel]
35
+ packages = ["src/sentiment", "src/api"]
36
+
37
+ [tool.ruff]
38
+ line-length = 100
39
+ target-version = "py312"
40
+
41
+ [tool.ruff.lint]
42
+ select = ["E", "F", "I", "N", "UP"]
43
+
44
+ [tool.pytest.ini_options]
45
+ testpaths = ["tests"]
46
+ pythonpath = ["src"]
mlruns/1/models/m-f9cac40424504a5a91d9449f38f5bd7c/artifacts/python_env.yaml ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ python: 3.12.8
2
+ build_dependencies:
3
+ - pip
4
+ - setuptools==81.0.0
5
+ - wheel
6
+ dependencies:
7
+ - -r requirements.txt
mlruns/1/models/m-f9cac40424504a5a91d9449f38f5bd7c/artifacts/python_model.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d0b2a47bd17bef43bde1711327fcec21e5427d2d19f96ceb96afec73431bb53
3
+ size 544321244
mlruns/1/models/m-f9cac40424504a5a91d9449f38f5bd7c/artifacts/registered_model_meta ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ model_name: arabert-lora
2
+ model_version: '1'
mlruns/1/models/m-f9cac40424504a5a91d9449f38f5bd7c/artifacts/requirements.txt ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ mlflow==3.12.0
2
+ annotated-doc==0.0.4
3
+ annotated-types==0.7.0
4
+ anyio==4.13.0
5
+ click==8.4.0
6
+ cloudpickle==3.1.2
7
+ colorama==0.4.6; sys_platform == "win32"
8
+ fastapi==0.136.1
9
+ h11==0.16.0
10
+ httptools==0.7.1
11
+ idna==3.15
12
+ pydantic-core==2.46.4
13
+ pydantic==2.13.4
14
+ python-dotenv==1.2.2
15
+ pyyaml==6.0.3
16
+ starlette==0.52.1
17
+ typing-extensions==4.15.0
18
+ typing-inspection==0.4.2
19
+ uvicorn==0.47.0
20
+ uvloop==0.22.1; platform_python_implementation != "PyPy" and sys_platform != "cygwin" and sys_platform != "win32"
21
+ watchfiles==1.2.0
22
+ websockets==16.0
mlruns/1/models/m-f9cac40424504a5a91d9449f38f5bd7c/artifacts/serving_input_example.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataframe_split": {
3
+ "columns": [
4
+ "text"
5
+ ],
6
+ "data": [
7
+ [
8
+ "\u0645\u0631\u062d\u0628\u0627"
9
+ ]
10
+ ]
11
+ }
12
+ }
mlruns/1/models/m-f9cac40424504a5a91d9449f38f5bd7c/artifacts/uv.lock ADDED
The diff for this file is too large to render. See raw diff