-
Notifications
You must be signed in to change notification settings - Fork 13
Expand file tree
/
Copy pathexample.py
More file actions
87 lines (76 loc) · 2.45 KB
/
example.py
File metadata and controls
87 lines (76 loc) · 2.45 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
import argparse
import json
import torch
from sensenova_si import get_model
def set_seed(seed=42):
torch.manual_seed(seed)
if torch.cuda.is_available():
torch.cuda.manual_seed(seed)
torch.cuda.manual_seed_all(seed)
if __name__ == "__main__":
set_seed()
parser = argparse.ArgumentParser(
description="Examples for SenseNova-SI single-run MCQ"
)
parser.add_argument(
"--model_path",
type=str,
default="sensenova/SenseNova-SI-1.3-InternVL3-8B",
help="Model path",
)
parser.add_argument(
"--image_paths",
type=str,
nargs="+",
default=[],
help="Path to image files, can specify multiple",
)
parser.add_argument(
"--question",
type=str,
default="Please describe the image in detail.",
help="Question to ask the model",
)
parser.add_argument(
"--jsonl_path",
type=str,
default=None,
help="Path to jsonl file containing examples",
)
parser.add_argument(
"--model_type",
type=str,
default="auto",
choices=["qwen", "internvl", "auto"],
help="Model type",
)
args = parser.parse_args()
model_path = args.model_path
print(f"Model path: {model_path}")
model = get_model(model_path, model_type=args.model_type)
if args.jsonl_path:
with open(args.jsonl_path, "r") as f:
for line in f:
entry = json.loads(line.strip())
image_paths = entry.get("image", [])
conversations = entry.get("conversations", [])
if conversations:
question = conversations[0].get("value", "")
else:
question = ""
id_ = entry.get("id", "")
gt = entry.get("GT", "")
if not image_paths or not question:
print(f"Skipping invalid entry id {id_}")
continue
print(f"Processing question id: {id_}")
response = model.generate(question, images=image_paths)
print(f"User: {question}")
print(f"Assistant: {response}")
print(f"Ground Truth: {gt}")
print("-" * 50)
else:
question = args.question
response = model.generate(question, images=args.image_paths)
print(f"User: {question}")
print(f"Assistant: {response}")