Upload 10 files

Browse files

Files changed (6) hide show

.gitattributes +35 -35
README.md +121 -121
config.json +6 -6
model.safetensors +1 -1
optimizer_scheduler_state.pt +1 -1
training_args.bin +1 -1

.gitattributes CHANGED Viewed

@@ -1,35 +1,35 @@
-*.7z filter=lfs diff=lfs merge=lfs -text
-*.arrow filter=lfs diff=lfs merge=lfs -text
-*.bin filter=lfs diff=lfs merge=lfs -text
-*.bz2 filter=lfs diff=lfs merge=lfs -text
-*.ckpt filter=lfs diff=lfs merge=lfs -text
-*.ftz filter=lfs diff=lfs merge=lfs -text
-*.gz filter=lfs diff=lfs merge=lfs -text
-*.h5 filter=lfs diff=lfs merge=lfs -text
-*.joblib filter=lfs diff=lfs merge=lfs -text
-*.lfs.* filter=lfs diff=lfs merge=lfs -text
-*.mlmodel filter=lfs diff=lfs merge=lfs -text
-*.model filter=lfs diff=lfs merge=lfs -text
-*.msgpack filter=lfs diff=lfs merge=lfs -text
-*.npy filter=lfs diff=lfs merge=lfs -text
-*.npz filter=lfs diff=lfs merge=lfs -text
-*.onnx filter=lfs diff=lfs merge=lfs -text
-*.ot filter=lfs diff=lfs merge=lfs -text
-*.parquet filter=lfs diff=lfs merge=lfs -text
-*.pb filter=lfs diff=lfs merge=lfs -text
-*.pickle filter=lfs diff=lfs merge=lfs -text
-*.pkl filter=lfs diff=lfs merge=lfs -text
-*.pt filter=lfs diff=lfs merge=lfs -text
-*.pth filter=lfs diff=lfs merge=lfs -text
-*.rar filter=lfs diff=lfs merge=lfs -text
-*.safetensors filter=lfs diff=lfs merge=lfs -text
-saved_model/**/* filter=lfs diff=lfs merge=lfs -text
-*.tar.* filter=lfs diff=lfs merge=lfs -text
-*.tar filter=lfs diff=lfs merge=lfs -text
-*.tflite filter=lfs diff=lfs merge=lfs -text
-*.tgz filter=lfs diff=lfs merge=lfs -text
-*.wasm filter=lfs diff=lfs merge=lfs -text
-*.xz filter=lfs diff=lfs merge=lfs -text
-*.zip filter=lfs diff=lfs merge=lfs -text
-*.zst filter=lfs diff=lfs merge=lfs -text
-*tfevents* filter=lfs diff=lfs merge=lfs -text

+*.7z filter=lfs diff=lfs merge=lfs -text
+*.arrow filter=lfs diff=lfs merge=lfs -text
+*.bin filter=lfs diff=lfs merge=lfs -text
+*.bz2 filter=lfs diff=lfs merge=lfs -text
+*.ckpt filter=lfs diff=lfs merge=lfs -text
+*.ftz filter=lfs diff=lfs merge=lfs -text
+*.gz filter=lfs diff=lfs merge=lfs -text
+*.h5 filter=lfs diff=lfs merge=lfs -text
+*.joblib filter=lfs diff=lfs merge=lfs -text
+*.lfs.* filter=lfs diff=lfs merge=lfs -text
+*.mlmodel filter=lfs diff=lfs merge=lfs -text
+*.model filter=lfs diff=lfs merge=lfs -text
+*.msgpack filter=lfs diff=lfs merge=lfs -text
+*.npy filter=lfs diff=lfs merge=lfs -text
+*.npz filter=lfs diff=lfs merge=lfs -text
+*.onnx filter=lfs diff=lfs merge=lfs -text
+*.ot filter=lfs diff=lfs merge=lfs -text
+*.parquet filter=lfs diff=lfs merge=lfs -text
+*.pb filter=lfs diff=lfs merge=lfs -text
+*.pickle filter=lfs diff=lfs merge=lfs -text
+*.pkl filter=lfs diff=lfs merge=lfs -text
+*.pt filter=lfs diff=lfs merge=lfs -text
+*.pth filter=lfs diff=lfs merge=lfs -text
+*.rar filter=lfs diff=lfs merge=lfs -text
+*.safetensors filter=lfs diff=lfs merge=lfs -text
+saved_model/**/* filter=lfs diff=lfs merge=lfs -text
+*.tar.* filter=lfs diff=lfs merge=lfs -text
+*.tar filter=lfs diff=lfs merge=lfs -text
+*.tflite filter=lfs diff=lfs merge=lfs -text
+*.tgz filter=lfs diff=lfs merge=lfs -text
+*.wasm filter=lfs diff=lfs merge=lfs -text
+*.xz filter=lfs diff=lfs merge=lfs -text
+*.zip filter=lfs diff=lfs merge=lfs -text
+*.zst filter=lfs diff=lfs merge=lfs -text
+*tfevents* filter=lfs diff=lfs merge=lfs -text

README.md CHANGED Viewed

@@ -1,121 +1,121 @@
----
-license: cc-by-nc-nd-4.0
-language:
-- en
-model-index:
-  - name: roberta-large Image Prompt Classifier
-    results:
-      - task:
-          type: text-classification
-        dataset:
-          name: nsfw-text-detection
-          type: custom
-        metrics:
-          - name: Accuracy
-            type: self-reported
-            value: 93%
-          - name: Precision
-            type: self-reported
-            value: 88%
-          - name: Recall
-            type: self-reported
-            value: 90%
----
-# roberta-large Image Prompt Classifier
-## Model Overview
-This model is a fine-tuned version of `roberta-large` designed specifically for classifying image generation prompts into three distinct categories: SAFE, QUESTIONABLE, and UNSAFE. Leveraging the robust capabilities of the `roberta-large` architecture, this model ensures high accuracy and reliability in identifying the nature of prompts used for generating images.
-## Model Details
-- **Model Name:** roberta-large Image Prompt Classifier
-- **Base Model:** [roberta-large](https://huggingface.co/roberta-large)
-- **Fine-tuned By:** Michał Młodawski
-- **Categories:**
-  - `0`: SAFE
-  - `1`: QUESTIONABLE
-  - `2`: UNSAFE
-## Use Cases
-This model is particularly useful for platforms and applications involving AI-generated content, where it is crucial to filter and classify prompts to maintain content safety and appropriateness. Some potential applications include:
-- **Content Moderation:** Automatically classify and filter prompts to prevent the generation of inappropriate or harmful images.
-- **User Safety:** Enhance user experience by ensuring that generated content adheres to safety guidelines.
-- **Compliance:** Help platforms comply with regulatory requirements by identifying and flagging potentially unsafe prompts.
-## How It Works
-The model takes an input prompt and classifies it into one of three categories:
-1. **SAFE:** Prompts that are deemed appropriate and free from harmful content.
-2. **QUESTIONABLE:** Prompts that may require further review due to potential ambiguity or slight risk.
-3. **UNSAFE:** Prompts that are likely to generate inappropriate or harmful content.
-The classification is based on the semantic understanding and contextual analysis provided by the `roberta-large` architecture, fine-tuned on a curated dataset tailored for this specific task.
-## Performance
-Extensive testing and validation have been conducted to ensure the model's performance meets high standards of accuracy and reliability. Key metrics include:
-- **Accuracy:** 93%
-- **Precision:** 88%
-- **Recall:** 90%
-These metrics highlight the model's capability to effectively distinguish between different categories of prompts with high confidence.
-## Getting Started
-To start using the roberta-large Image Prompt Classifier, you can easily integrate it into your existing workflows with the following steps:
-### Installation
-    pip install transformers==4.37.2
-    pip install torch==2.3.1
-### Usage
-    import os
-    from transformers import AutoTokenizer, AutoModelForSequenceClassification
-    import torch
-    model_repo = "MichalMlodawski/nsfw-text-detection-large"
-    tokenizer = AutoTokenizer.from_pretrained(model_path)
-    model = AutoModelForSequenceClassification.from_pretrained(model_path)
-    def classify_text(text):
-        inputs = tokenizer(text, return_tensors="pt", truncation=True, padding=True, max_length=512)
-        with torch.no_grad():
-            outputs = model(**inputs)
-        logits = outputs.logits
-        predicted_class = torch.argmax(logits, dim=1).item()
-        return predicted_class
-    if __name__ == "__main__":
-        examples = [
-            {"text": "wild west cowboy caravan through Arizona Desert , Men Woman and children, horse drawn carriages", "expected_class": 0},
-            {"text": "A person with questionable intentions in a dimly lit alley.", "expected_class": 1},
-            {"text": "An inappropriate scene involving explicit content.", "expected_class": 2}
-        ]
-        for example in examples:
-            text = example["text"]
-            expected_class = example["expected_class"]
-            predicted_class = classify_text(text)
-            print(f"Prompt: {text}")
-            print(f"Predicted class: {predicted_class}")
-            print(f"Expected class: {expected_class}")
-            print("---")
-### Disclaimer
-The dataset includes actual prompts for image generation that could be perceived as abusive, offensive, or obscene. Furthermore, the examples and data might contain unfavorable information about certain businesses. We merely collect this data and do not assume any legal responsibility.
-Please note: A portion of the data was created using Large Language Models (LLM).

+---
+license: cc-by-nc-nd-4.0
+language:
+- en
+model-index:
+  - name: roberta-large Image Prompt Classifier
+    results:
+      - task:
+          type: text-classification
+        dataset:
+          name: nsfw-text-detection
+          type: custom
+        metrics:
+          - name: Accuracy
+            type: self-reported
+            value: 93%
+          - name: Precision
+            type: self-reported
+            value: 88%
+          - name: Recall
+            type: self-reported
+            value: 90%
+---
+# roberta-large Image Prompt Classifier
+## Model Overview
+This model is a fine-tuned version of `roberta-large` designed specifically for classifying image generation prompts into three distinct categories: SAFE, QUESTIONABLE, and UNSAFE. Leveraging the robust capabilities of the `roberta-large` architecture, this model ensures high accuracy and reliability in identifying the nature of prompts used for generating images.
+## Model Details
+- **Model Name:** roberta-large Image Prompt Classifier
+- **Base Model:** [roberta-large](https://huggingface.co/roberta-large)
+- **Fine-tuned By:** Michał Młodawski
+- **Categories:**
+  - `0`: SAFE
+  - `1`: QUESTIONABLE
+  - `2`: UNSAFE
+## Use Cases
+This model is particularly useful for platforms and applications involving AI-generated content, where it is crucial to filter and classify prompts to maintain content safety and appropriateness. Some potential applications include:
+- **Content Moderation:** Automatically classify and filter prompts to prevent the generation of inappropriate or harmful images.
+- **User Safety:** Enhance user experience by ensuring that generated content adheres to safety guidelines.
+- **Compliance:** Help platforms comply with regulatory requirements by identifying and flagging potentially unsafe prompts.
+## How It Works
+The model takes an input prompt and classifies it into one of three categories:
+1. **SAFE:** Prompts that are deemed appropriate and free from harmful content.
+2. **QUESTIONABLE:** Prompts that may require further review due to potential ambiguity or slight risk.
+3. **UNSAFE:** Prompts that are likely to generate inappropriate or harmful content.
+The classification is based on the semantic understanding and contextual analysis provided by the `roberta-large` architecture, fine-tuned on a curated dataset tailored for this specific task.
+## Performance
+Extensive testing and validation have been conducted to ensure the model's performance meets high standards of accuracy and reliability. Key metrics include:
+- **Accuracy:** 93%
+- **Precision:** 88%
+- **Recall:** 90%
+These metrics highlight the model's capability to effectively distinguish between different categories of prompts with high confidence.
+## Getting Started
+To start using the roberta-large Image Prompt Classifier, you can easily integrate it into your existing workflows with the following steps:
+### Installation
+    pip install transformers==4.37.2
+    pip install torch==2.3.1
+### Usage
+    import os
+    from transformers import AutoTokenizer, AutoModelForSequenceClassification
+    import torch
+    model_repo = "MichalMlodawski/nsfw-text-detection-large"
+    tokenizer = AutoTokenizer.from_pretrained(model_repo)
+    model = AutoModelForSequenceClassification.from_pretrained(model_repo)
+    def classify_text(text):
+        inputs = tokenizer(text, return_tensors="pt", truncation=True, padding=True, max_length=512)
+        with torch.no_grad():
+            outputs = model(**inputs)
+        logits = outputs.logits
+        predicted_class = torch.argmax(logits, dim=1).item()
+        return predicted_class
+    if __name__ == "__main__":
+        examples = [
+            {"text": "wild west cowboy caravan through Arizona Desert , Men Woman and children, horse drawn carriages", "expected_class": 0},
+            {"text": "A person with questionable intentions in a dimly lit alley.", "expected_class": 1},
+            {"text": "An inappropriate scene involving explicit content.", "expected_class": 2}
+        ]
+        for example in examples:
+            text = example["text"]
+            expected_class = example["expected_class"]
+            predicted_class = classify_text(text)
+            print(f"Prompt: {text}")
+            print(f"Predicted class: {predicted_class}")
+            print(f"Expected class: {expected_class}")
+            print("---")
+### Disclaimer
+The dataset includes actual prompts for image generation that could be perceived as abusive, offensive, or obscene. Furthermore, the examples and data might contain unfavorable information about certain businesses. We merely collect this data and do not assume any legal responsibility.
+Please note: A portion of the data was created using Large Language Models (LLMs).

config.json CHANGED Viewed

@@ -11,16 +11,16 @@
   "hidden_dropout_prob": 0.1,
   "hidden_size": 1024,
   "id2label": {
-    "0": "SAFE",
-    "1": "QUESTIONABLE",
-    "2": "UNSAFE"
   },
   "initializer_range": 0.02,
   "intermediate_size": 4096,
   "label2id": {
-    "SAFE": 0,
-    "QUESTIONABLE": 1,
-    "UNSAFE": 2
   },
   "layer_norm_eps": 1e-05,
   "max_position_embeddings": 514,

   "hidden_dropout_prob": 0.1,
   "hidden_size": 1024,
   "id2label": {
+    "0": "LABEL_0",
+    "1": "LABEL_1",
+    "2": "LABEL_2"
   },
   "initializer_range": 0.02,
   "intermediate_size": 4096,
   "label2id": {
+    "LABEL_0": 0,
+    "LABEL_1": 1,
+    "LABEL_2": 2
   },
   "layer_norm_eps": 1e-05,
   "max_position_embeddings": 514,

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7ea8f0e9da471e19fa58ef0310a680708a0f63089e17886604ba0c20528df6c0
 size 1421499516

 version https://git-lfs.github.com/spec/v1
+oid sha256:e6412737d149c0b28e5d1fb106b20dae7efc371a952bced0ef573095d54653a4
 size 1421499516

optimizer_scheduler_state.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:28311a8ef05854ed704749bf68a9f6279875692a2b488725afab26fb70a886a6
 size 2843250589

 version https://git-lfs.github.com/spec/v1
+oid sha256:4353e043721a02ce4857a40bbfbfd05b98d3b756ff1b6f3ba873bbcd6b31bc8b
 size 2843250589

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:77769e09e9c4ebbc63535129bf21c72d6b5c6920c5791de5052edc9787f9fc48
 size 4664

 version https://git-lfs.github.com/spec/v1
+oid sha256:e6910f30f1620141f6f53c1d666baddaf2d4f9deded6048915534d87935996e3
 size 4664