lfs

Files changed (10) hide show

app.py CHANGED Viewed

@@ -6,7 +6,7 @@ from transformers import CLIPProcessor, CLIPModel, pipeline, BlipProcessor, Blip
 model = CLIPModel.from_pretrained("model")
 processor = CLIPProcessor.from_pretrained("tokenizer")
-vqa_pipeline = pipeline("visual-question-answering")
 space_type_labels = ["living room", "bedroom", "kitchen", "terrace", "closet","bathroom", "dining room", "office", "garage", "garden",
     "balcony", "attic", "hallway", "laundry room","gym", "playroom", "storage room", "studio","is_exterior","empty_interior_room","swimming pool"]

 model = CLIPModel.from_pretrained("model")
 processor = CLIPProcessor.from_pretrained("tokenizer")
+vqa_pipeline = pipeline("visual-question-answering",model="vqa")
 space_type_labels = ["living room", "bedroom", "kitchen", "terrace", "closet","bathroom", "dining room", "office", "garage", "garden",
     "balcony", "attic", "hallway", "laundry room","gym", "playroom", "storage room", "studio","is_exterior","empty_interior_room","swimming pool"]

model/config.json ADDED Viewed

+{
+  "_name_or_path": "openai/clip-vit-base-patch32",
+  "architectures": [
+    "CLIPModel"
+  ],
+  "initializer_factor": 1.0,
+  "logit_scale_init_value": 2.6592,
+  "model_type": "clip",
+  "projection_dim": 512,
+  "text_config": {
+    "bos_token_id": 0,
+    "dropout": 0.0,
+    "eos_token_id": 2,
+    "model_type": "clip_text_model"
+  },
+  "torch_dtype": "float32",
+  "transformers_version": "4.37.1",
+  "vision_config": {
+    "dropout": 0.0,
+    "model_type": "clip_vision_model"
+  }
+}

vqa/.DS_Store ADDED Viewed

Binary file (6.15 kB). View file

vqa/config.json ADDED Viewed

The diff for this file is too large to render. See raw diff

vqa/model.safetensors ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:5a1fef76c03050f1d7cc7fff64a46fc56a8c6ea48f924cc1922b3aa1e32121e1
+size 470378972

vqa/preprocessor_config.json ADDED Viewed

+{
+  "do_normalize": true,
+  "do_pad": true,
+  "do_rescale": true,
+  "do_resize": true,
+  "image_mean": [
+    0.5,
+    0.5,
+    0.5
+  ],
+  "image_processor_type": "ViltImageProcessor",
+  "image_std": [
+    0.5,
+    0.5,
+    0.5
+  ],
+  "resample": 3,
+  "rescale_factor": 0.00392156862745098,
+  "size": {
+    "shortest_edge": 384
+  },
+  "size_divisor": 32
+}

vqa/special_tokens_map.json ADDED Viewed

+{
+  "cls_token": {
+    "content": "[CLS]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "mask_token": {
+    "content": "[MASK]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": {
+    "content": "[PAD]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "sep_token": {
+    "content": "[SEP]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "unk_token": {
+    "content": "[UNK]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  }
+}

vqa/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

vqa/tokenizer_config.json ADDED Viewed

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 40,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "BertTokenizer",
+  "unk_token": "[UNK]"
+}

vqa/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff