Update after integration (#17)

Files changed (6)

config.json CHANGED Viewed

@@ -82,8 +82,8 @@
     "bos_token_id": null,
     "chunk_size_feed_forward": 0,
     "cross_attention_hidden_size": null,
-    "d_ff": 3968,
-    "d_kv": 64,
     "decoder_start_token_id": null,
     "dense_act_fn": "gelu_new",
     "diversity_penalty": 0.0,
@@ -133,7 +133,7 @@
     "return_dict": true,
     "return_dict_in_generate": false,
     "sep_token_id": null,
-    "seq_len": 4096,
     "suppress_tokens": null,
     "task_specific_params": null,
     "temperature": 1.0,

     "bos_token_id": null,
     "chunk_size_feed_forward": 0,
     "cross_attention_hidden_size": null,
+    "intermediate_size": 3968,
+    "head_dim": 64,
     "decoder_start_token_id": null,
     "dense_act_fn": "gelu_new",
     "diversity_penalty": 0.0,
     "return_dict": true,
     "return_dict_in_generate": false,
     "sep_token_id": null,
+    "max_num_patches": 4096,
     "suppress_tokens": null,
     "task_specific_params": null,
     "temperature": 1.0,

md.py CHANGED Viewed

@@ -11,7 +11,7 @@ model = Kosmos2_5ForConditionalGeneration.from_pretrained(repo, device_map=devic
 processor = AutoProcessor.from_pretrained(repo)
 # sample image
-url = "https://huggingface.co/microsoft/kosmos-2.5/blob/main/receipt_00008.png"
 image = Image.open(requests.get(url, stream=True).raw)
 prompt = "<md>"
@@ -30,4 +30,4 @@ generated_ids = model.generate(
 )
 generated_text = processor.batch_decode(generated_ids, skip_special_tokens=True)
-print(generated_text[0])

 processor = AutoProcessor.from_pretrained(repo)
 # sample image
+url = "https://huggingface.co/microsoft/kosmos-2.5/resolve/main/receipt_00008.png"
 image = Image.open(requests.get(url, stream=True).raw)
 prompt = "<md>"
 )
 generated_text = processor.batch_decode(generated_ids, skip_special_tokens=True)
+print(generated_text[0])

ocr.py CHANGED Viewed

@@ -11,7 +11,7 @@ model = Kosmos2_5ForConditionalGeneration.from_pretrained(repo, device_map=devic
 processor = AutoProcessor.from_pretrained(repo)
 # sample image
-url = "https://huggingface.co/microsoft/kosmos-2.5/blob/main/receipt_00008.png"
 image = Image.open(requests.get(url, stream=True).raw)
 # bs = 1
@@ -70,4 +70,4 @@ for line in lines:
         continue
     line = list(map(int, line[:8]))
     draw.polygon(line, outline="red")
-image.save("output.png")

 processor = AutoProcessor.from_pretrained(repo)
 # sample image
+url = "https://huggingface.co/microsoft/kosmos-2.5/resolve/main/receipt_00008.png"
 image = Image.open(requests.get(url, stream=True).raw)
 # bs = 1
         continue
     line = list(map(int, line[:8]))
     draw.polygon(line, outline="red")
+image.save("output.png")

special_tokens_map.json ADDED Viewed

+{
+  "boi_token": "<image>",
+  "bos_token": {
+    "content": "<s>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "eoi_token": "</image>",
+  "eos_token": {
+    "content": "</s>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "image_token": "<s>",
+  "pad_token": {
+    "content": "<pad>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "unk_token": {
+    "content": "<unk>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  }
+}

tokenizer.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

tokenizer_config.json CHANGED Viewed

The diff for this file is too large to render. See raw diff