UltraDoughnut committed on Oct 9, 2025

Commit

c206437

verified ·

1 Parent(s): 81b77f6

Upload folder using huggingface_hub

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

lisa-ivl3-2b_bi2cbe_aati_srm/ckpt_model/config.json +143 -0
lisa-ivl3-2b_bi2cbe_aati_srm/ckpt_model/model.safetensors +3 -0
lisa-ivl3-2b_bi2cbe_aati_srm/ckpt_model/training_args.bin +3 -0
lisa-ivl3-2b_bi2cbe_aati_srm/evaluation_metrics.json +116 -0
lisa-ivl3-2b_bi2cbe_aati_srm/events.out.tfevents.1758303972.bask-pg0308u25a.2176098.0 +3 -0
lisa-ivl3-2b_bi2cbe_aati_srm/events.out.tfevents.1758304185.bask-pg0308u25a.2184107.0 +3 -0
lisa-ivl3-2b_bi2cbe_aati_srm/runs/Sep19_18-46-08_bask-pg0308u25a/events.out.tfevents.1758304037.bask-pg0308u25a.2176098.1 +3 -0
lisa-ivl3-2b_bi2cbe_aati_srm/runs/Sep19_18-49-42_bask-pg0308u25a/events.out.tfevents.1758304237.bask-pg0308u25a.2184107.1 +3 -0
lisa-ivl3-2b_bi2cbe_aati_srm/runs/Sep19_18-49-42_bask-pg0308u25a/events.out.tfevents.1758339214.bask-pg0308u25a.2184107.2 +3 -0
lisa-ivl3-2b_bi2cbe_aati_srs/ckpt_model/config.json +143 -0
lisa-ivl3-2b_bi2cbe_aati_srs/ckpt_model/model.safetensors +3 -0
lisa-ivl3-2b_bi2cbe_aati_srs/ckpt_model/training_args.bin +3 -0
lisa-ivl3-2b_bi2cbe_aati_srs/evaluation_metrics.json +116 -0
lisa-ivl3-2b_bi2cbe_aati_srs/events.out.tfevents.1758407218.bask-pg0308u25a.3988218.0 +3 -0
lisa-ivl3-2b_bi2cbe_aati_srs/runs/Sep20_23-26-55_bask-pg0308u25a/events.out.tfevents.1758407268.bask-pg0308u25a.3988218.1 +3 -0
lisa-ivl3-2b_bi2cbe_aati_srs/runs/Sep20_23-26-55_bask-pg0308u25a/events.out.tfevents.1758441983.bask-pg0308u25a.3988218.2 +3 -0
lisa-ivl3-2b_bi2cbe_ib_vlorati_sr/ckpt_model/config.json +143 -0
lisa-ivl3-2b_bi2cbe_ib_vlorati_sr/ckpt_model/model.safetensors +3 -0
lisa-ivl3-2b_bi2cbe_ib_vlorati_sr/ckpt_model/training_args.bin +3 -0
lisa-ivl3-2b_bi2cbe_ib_vlorati_sr/evaluation_metrics.json +116 -0
lisa-ivl3-2b_bi2cbe_ib_vlorati_sr/events.out.tfevents.1758822942.bask-pg0308u25a.3977024.0 +3 -0
lisa-ivl3-2b_bi2cbe_ib_vlorati_sr/events.out.tfevents.1758823030.bask-pg0308u25a.3998347.0 +3 -0
lisa-ivl3-2b_bi2cbe_ib_vlorati_sr/runs/Sep25_18-57-07_bask-pg0308u25a/events.out.tfevents.1758823107.bask-pg0308u25a.3998347.1 +3 -0
lisa-ivl3-2b_bi2cbe_ib_vlorati_sr/runs/Sep25_18-57-07_bask-pg0308u25a/events.out.tfevents.1758870402.bask-pg0308u25a.3998347.2 +3 -0
lisa-ivl3-2b_bi2cbe_ivs_vlorati_sr/ckpt_model/config.json +143 -0
lisa-ivl3-2b_bi2cbe_ivs_vlorati_sr/ckpt_model/model.safetensors +3 -0
lisa-ivl3-2b_bi2cbe_ivs_vlorati_sr/ckpt_model/training_args.bin +3 -0
lisa-ivl3-2b_bi2cbe_ivs_vlorati_sr/evaluation_metrics.json +116 -0
lisa-ivl3-2b_bi2cbe_ivs_vlorati_sr/events.out.tfevents.1758558655.bask-pg0308u29a.637997.0 +3 -0
lisa-ivl3-2b_bi2cbe_ivs_vlorati_sr/runs/Sep22_17-30-52_bask-pg0308u29a/events.out.tfevents.1758558731.bask-pg0308u29a.637997.1 +3 -0
lisa-ivl3-2b_bi2cbe_ivs_vlorati_sr/runs/Sep22_17-30-52_bask-pg0308u29a/events.out.tfevents.1758608704.bask-pg0308u29a.637997.2 +3 -0
lisa-ivl3-2b_bi2cbe_tb_vlorati_sr/ckpt_model/config.json +143 -0
lisa-ivl3-2b_bi2cbe_tb_vlorati_sr/ckpt_model/model.safetensors +3 -0
lisa-ivl3-2b_bi2cbe_tb_vlorati_sr/ckpt_model/training_args.bin +3 -0
lisa-ivl3-2b_bi2cbe_tb_vlorati_sr/evaluation_metrics.json +116 -0
lisa-ivl3-2b_bi2cbe_tb_vlorati_sr/events.out.tfevents.1758821654.bask-pg0308u18a.998112.0 +3 -0
lisa-ivl3-2b_bi2cbe_tb_vlorati_sr/events.out.tfevents.1758821976.bask-pg0308u18a.1004472.0 +3 -0
lisa-ivl3-2b_bi2cbe_tb_vlorati_sr/events.out.tfevents.1758822179.bask-pg0308u18a.1008370.0 +3 -0
lisa-ivl3-2b_bi2cbe_tb_vlorati_sr/runs/Sep25_18-34-12_bask-pg0308u18a/events.out.tfevents.1758821725.bask-pg0308u18a.998112.1 +3 -0
lisa-ivl3-2b_bi2cbe_tb_vlorati_sr/runs/Sep25_18-39-34_bask-pg0308u18a/events.out.tfevents.1758822035.bask-pg0308u18a.1004472.1 +3 -0
lisa-ivl3-2b_bi2cbe_tb_vlorati_sr/runs/Sep25_18-42-56_bask-pg0308u18a/events.out.tfevents.1758822240.bask-pg0308u18a.1008370.1 +3 -0
lisa-ivl3-2b_bi2cbe_tb_vlorati_sr/runs/Sep25_18-42-56_bask-pg0308u18a/events.out.tfevents.1758869487.bask-pg0308u18a.1008370.2 +3 -0
lisa-ivl3-2b_bi2cbe_vlorati_coco/ckpt_model/config.json +143 -0
lisa-ivl3-2b_bi2cbe_vlorati_coco/ckpt_model/model.safetensors +3 -0
lisa-ivl3-2b_bi2cbe_vlorati_coco/ckpt_model/training_args.bin +3 -0
lisa-ivl3-2b_bi2cbe_vlorati_coco/evaluation_metrics.json +116 -0
lisa-ivl3-2b_bi2cbe_vlorati_coco/events.out.tfevents.1758236140.bask-pg0309u16a.1220041.0 +3 -0
lisa-ivl3-2b_bi2cbe_vlorati_coco/runs/Sep18_23-55-37_bask-pg0309u16a/events.out.tfevents.1758236201.bask-pg0309u16a.1220041.1 +3 -0
lisa-ivl3-2b_bi2cbe_vlorati_coco/runs/Sep18_23-55-37_bask-pg0309u16a/events.out.tfevents.1758283609.bask-pg0309u16a.1220041.2 +3 -0
lisa-ivl3-2b_bi2cbe_vlorati_sr/ckpt_model/config.json +143 -0

lisa-ivl3-2b_bi2cbe_aati_srm/ckpt_model/config.json ADDED Viewed

	@@ -0,0 +1,143 @@

+{
+  "architectures": [
+    "InternVL3Self"
+  ],
+  "auto_map": {
+    "AutoConfig": "configuration_internvl_chat.InternVLChatConfig",
+    "AutoModel": "modeling_internvl_chat.InternVLChatModel",
+    "AutoModelForCausalLM": "modeling_internvl_chat.InternVLChatModel"
+  },
+  "downsample_ratio": 0.5,
+  "dtype": "bfloat16",
+  "dynamic_image_size": true,
+  "eos_token_id": 151645,
+  "force_image_size": 448,
+  "hidden_size": 1536,
+  "image_fold": null,
+  "llm_config": {
+    "_attn_implementation_autoset": true,
+    "_name_or_path": "./pretrained/Qwen2.5-32B-Instruct",
+    "architectures": [
+      "Qwen2ForCausalLM"
+    ],
+    "attention_dropout": 0.0,
+    "bos_token_id": 151643,
+    "dtype": "bfloat16",
+    "eos_token_id": 151643,
+    "hidden_act": "silu",
+    "hidden_size": 1536,
+    "initializer_range": 0.02,
+    "intermediate_size": 8960,
+    "layer_types": [
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention"
+    ],
+    "max_position_embeddings": 32768,
+    "max_window_layers": 70,
+    "model_type": "qwen2",
+    "moe_config": null,
+    "num_attention_heads": 12,
+    "num_hidden_layers": 28,
+    "num_key_value_heads": 2,
+    "rms_norm_eps": 1e-06,
+    "rope_scaling": {
+      "factor": 2.0,
+      "rope_type": "dynamic",
+      "type": "dynamic"
+    },
+    "rope_theta": 1000000.0,
+    "sliding_window": null,
+    "use_bfloat16": true,
+    "use_cache": false,
+    "use_sliding_window": false,
+    "vocab_size": 151676
+  },
+  "max_dynamic_patch": 12,
+  "min_dynamic_patch": 1,
+  "model_type": "internvl_chat",
+  "output_attentions": false,
+  "pad2square": false,
+  "pad_token_id": 151643,
+  "ps_version": "v2",
+  "select_layer": -1,
+  "system_message": null,
+  "template": "internvl2_5",
+  "tie_word_embeddings": false,
+  "transformers_version": null,
+  "use_backbone_lora": 0,
+  "use_llm_lora": 0,
+  "use_thumbnail": true,
+  "vision_config": {
+    "_attn_implementation_autoset": true,
+    "_name_or_path": "OpenGVLab/InternViT-6B-448px-V1-5",
+    "architectures": [
+      "InternVisionModel"
+    ],
+    "attention_dropout": 0.0,
+    "auto_map": {
+      "AutoConfig": "configuration_intern_vit.InternVisionConfig",
+      "AutoModel": "modeling_intern_vit.InternVisionModel"
+    },
+    "capacity_factor": 1.2,
+    "drop_path_rate": 0.1,
+    "dropout": 0.0,
+    "dtype": "bfloat16",
+    "eval_capacity_factor": 1.4,
+    "hidden_act": "gelu",
+    "hidden_size": 1024,
+    "image_size": 448,
+    "initializer_factor": 0.1,
+    "initializer_range": 1e-10,
+    "intermediate_size": 4096,
+    "laux_allreduce": "all_nodes",
+    "layer_norm_eps": 1e-06,
+    "model_type": "intern_vit_6b",
+    "moe_coeff_ratio": 0.5,
+    "moe_intermediate_size": 768,
+    "moe_output_scale": 4.0,
+    "noisy_gate_policy": "RSample_before",
+    "norm_type": "layer_norm",
+    "num_attention_heads": 16,
+    "num_channels": 3,
+    "num_experts": 8,
+    "num_hidden_layers": 24,
+    "num_routed_experts": 4,
+    "num_shared_experts": 4,
+    "patch_size": 14,
+    "qk_normalization": false,
+    "qkv_bias": true,
+    "shared_expert_intermediate_size": 3072,
+    "use_bfloat16": true,
+    "use_flash_attn": true,
+    "use_moe": false,
+    "use_residual": true,
+    "use_rts": false,
+    "use_weighted_residual": false
+  }
+}

lisa-ivl3-2b_bi2cbe_aati_srm/ckpt_model/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5f3befb636a4bfdc7f407e8ec01f5b84a2869952dea6106070ab00f7d6b760ef
+size 4211070232

lisa-ivl3-2b_bi2cbe_aati_srm/ckpt_model/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:240c4be74f4b416addef8e472ffd17a8f0a9206792bbe14eb3617a6736ec132e
+size 7352

lisa-ivl3-2b_bi2cbe_aati_srm/evaluation_metrics.json ADDED Viewed

	@@ -0,0 +1,116 @@

+[
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 1.0,
+        "eval_giou": 0.528189480304718,
+        "eval_ciou": 0.6158800721168518
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 2.0,
+        "eval_giou": 0.57504802942276,
+        "eval_ciou": 0.6519048810005188
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 3.0,
+        "eval_giou": 0.5494521856307983,
+        "eval_ciou": 0.6140078902244568
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 4.0,
+        "eval_giou": 0.5751751065254211,
+        "eval_ciou": 0.6430273652076721
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 5.0,
+        "eval_giou": 0.5621751546859741,
+        "eval_ciou": 0.6091215014457703
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 6.0,
+        "eval_giou": 0.5681710243225098,
+        "eval_ciou": 0.5827724933624268
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 7.0,
+        "eval_giou": 0.5692390203475952,
+        "eval_ciou": 0.5854980945587158
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 8.0,
+        "eval_giou": 0.5853511095046997,
+        "eval_ciou": 0.5549483895301819
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 9.0,
+        "eval_giou": 0.5778804421424866,
+        "eval_ciou": 0.5894233584403992
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 10.0,
+        "eval_giou": 0.5841119885444641,
+        "eval_ciou": 0.5798441171646118
+    },
+    {
+        "val_dataset": "ReasonSeg|test",
+        "epoch": 10.0,
+        "eval_giou": 0.6100905537605286,
+        "eval_ciou": 0.6119125485420227
+    },
+    {
+        "val_dataset": "refcoco|unc|val",
+        "epoch": 10.0,
+        "eval_giou": 0.799595832824707,
+        "eval_ciou": 0.8027365207672119
+    },
+    {
+        "val_dataset": "refcoco|unc|testA",
+        "epoch": 10.0,
+        "eval_giou": 0.8168815970420837,
+        "eval_ciou": 0.8243600130081177
+    },
+    {
+        "val_dataset": "refcoco|unc|testB",
+        "epoch": 10.0,
+        "eval_giou": 0.7745703458786011,
+        "eval_ciou": 0.7807985544204712
+    },
+    {
+        "val_dataset": "refcoco+|unc|val",
+        "epoch": 10.0,
+        "eval_giou": 0.7551393508911133,
+        "eval_ciou": 0.7453246712684631
+    },
+    {
+        "val_dataset": "refcoco+|unc|testA",
+        "epoch": 10.0,
+        "eval_giou": 0.7942529916763306,
+        "eval_ciou": 0.7944912910461426
+    },
+    {
+        "val_dataset": "refcoco+|unc|testB",
+        "epoch": 10.0,
+        "eval_giou": 0.7106485366821289,
+        "eval_ciou": 0.6990127563476562
+    },
+    {
+        "val_dataset": "refcocog|umd|test",
+        "epoch": 10.0,
+        "eval_giou": 0.7611709833145142,
+        "eval_ciou": 0.7682604193687439
+    },
+    {
+        "val_dataset": "refcocog|umd|val",
+        "epoch": 10.0,
+        "eval_giou": 0.7570181488990784,
+        "eval_ciou": 0.7642934918403625
+    }
+]

lisa-ivl3-2b_bi2cbe_aati_srm/events.out.tfevents.1758303972.bask-pg0308u25a.2176098.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6fd0eb014901254de4a95eb71fc2571d348cabd50a57e396fb2c3d342a3d7fb9
+size 486

lisa-ivl3-2b_bi2cbe_aati_srm/events.out.tfevents.1758304185.bask-pg0308u25a.2184107.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a1af39459ef2a226054ba8d41e28d9351e1edf097f258d661335b41ebe8f3adc
+size 212352

lisa-ivl3-2b_bi2cbe_aati_srm/runs/Sep19_18-46-08_bask-pg0308u25a/events.out.tfevents.1758304037.bask-pg0308u25a.2176098.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c4044136eab8f6e9cbcae192b20ebf5e4ed93ba0420ebf5e87c4b2238109fa4e
+size 9325

lisa-ivl3-2b_bi2cbe_aati_srm/runs/Sep19_18-49-42_bask-pg0308u25a/events.out.tfevents.1758304237.bask-pg0308u25a.2184107.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:94cc218abf38e00bc41bdedd1db488f808895ac0ae3c3898e84ea6a04bec0e07
+size 116381

lisa-ivl3-2b_bi2cbe_aati_srm/runs/Sep19_18-49-42_bask-pg0308u25a/events.out.tfevents.1758339214.bask-pg0308u25a.2184107.2 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c63060c4d02dcdbdc52b17a6208816f1c9a7a952fd8d4159426ee935d22b9aad
+size 1402

lisa-ivl3-2b_bi2cbe_aati_srs/ckpt_model/config.json ADDED Viewed

	@@ -0,0 +1,143 @@

+{
+  "architectures": [
+    "InternVL3Self"
+  ],
+  "auto_map": {
+    "AutoConfig": "configuration_internvl_chat.InternVLChatConfig",
+    "AutoModel": "modeling_internvl_chat.InternVLChatModel",
+    "AutoModelForCausalLM": "modeling_internvl_chat.InternVLChatModel"
+  },
+  "downsample_ratio": 0.5,
+  "dtype": "bfloat16",
+  "dynamic_image_size": true,
+  "eos_token_id": 151645,
+  "force_image_size": 448,
+  "hidden_size": 1536,
+  "image_fold": null,
+  "llm_config": {
+    "_attn_implementation_autoset": true,
+    "_name_or_path": "./pretrained/Qwen2.5-32B-Instruct",
+    "architectures": [
+      "Qwen2ForCausalLM"
+    ],
+    "attention_dropout": 0.0,
+    "bos_token_id": 151643,
+    "dtype": "bfloat16",
+    "eos_token_id": 151643,
+    "hidden_act": "silu",
+    "hidden_size": 1536,
+    "initializer_range": 0.02,
+    "intermediate_size": 8960,
+    "layer_types": [
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention"
+    ],
+    "max_position_embeddings": 32768,
+    "max_window_layers": 70,
+    "model_type": "qwen2",
+    "moe_config": null,
+    "num_attention_heads": 12,
+    "num_hidden_layers": 28,
+    "num_key_value_heads": 2,
+    "rms_norm_eps": 1e-06,
+    "rope_scaling": {
+      "factor": 2.0,
+      "rope_type": "dynamic",
+      "type": "dynamic"
+    },
+    "rope_theta": 1000000.0,
+    "sliding_window": null,
+    "use_bfloat16": true,
+    "use_cache": false,
+    "use_sliding_window": false,
+    "vocab_size": 151676
+  },
+  "max_dynamic_patch": 12,
+  "min_dynamic_patch": 1,
+  "model_type": "internvl_chat",
+  "output_attentions": false,
+  "pad2square": false,
+  "pad_token_id": 151643,
+  "ps_version": "v2",
+  "select_layer": -1,
+  "system_message": null,
+  "template": "internvl2_5",
+  "tie_word_embeddings": false,
+  "transformers_version": null,
+  "use_backbone_lora": 0,
+  "use_llm_lora": 0,
+  "use_thumbnail": true,
+  "vision_config": {
+    "_attn_implementation_autoset": true,
+    "_name_or_path": "OpenGVLab/InternViT-6B-448px-V1-5",
+    "architectures": [
+      "InternVisionModel"
+    ],
+    "attention_dropout": 0.0,
+    "auto_map": {
+      "AutoConfig": "configuration_intern_vit.InternVisionConfig",
+      "AutoModel": "modeling_intern_vit.InternVisionModel"
+    },
+    "capacity_factor": 1.2,
+    "drop_path_rate": 0.1,
+    "dropout": 0.0,
+    "dtype": "bfloat16",
+    "eval_capacity_factor": 1.4,
+    "hidden_act": "gelu",
+    "hidden_size": 1024,
+    "image_size": 448,
+    "initializer_factor": 0.1,
+    "initializer_range": 1e-10,
+    "intermediate_size": 4096,
+    "laux_allreduce": "all_nodes",
+    "layer_norm_eps": 1e-06,
+    "model_type": "intern_vit_6b",
+    "moe_coeff_ratio": 0.5,
+    "moe_intermediate_size": 768,
+    "moe_output_scale": 4.0,
+    "noisy_gate_policy": "RSample_before",
+    "norm_type": "layer_norm",
+    "num_attention_heads": 16,
+    "num_channels": 3,
+    "num_experts": 8,
+    "num_hidden_layers": 24,
+    "num_routed_experts": 4,
+    "num_shared_experts": 4,
+    "patch_size": 14,
+    "qk_normalization": false,
+    "qkv_bias": true,
+    "shared_expert_intermediate_size": 3072,
+    "use_bfloat16": true,
+    "use_flash_attn": true,
+    "use_moe": false,
+    "use_residual": true,
+    "use_rts": false,
+    "use_weighted_residual": false
+  }
+}

lisa-ivl3-2b_bi2cbe_aati_srs/ckpt_model/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8e94e426c479692c600bd7da2a58a66d89b1a0b6105e5f4fba892bb35fa05130
+size 4211070232

lisa-ivl3-2b_bi2cbe_aati_srs/ckpt_model/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9efb840060edee20988b8e9bb354bde899f2bb93875da91a53a68a5e8259ceb3
+size 7352

lisa-ivl3-2b_bi2cbe_aati_srs/evaluation_metrics.json ADDED Viewed

	@@ -0,0 +1,116 @@

+[
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 1.0,
+        "eval_giou": 0.5235294699668884,
+        "eval_ciou": 0.5689558982849121
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 2.0,
+        "eval_giou": 0.4938444197177887,
+        "eval_ciou": 0.5315812826156616
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 3.0,
+        "eval_giou": 0.52805095911026,
+        "eval_ciou": 0.5778353810310364
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 4.0,
+        "eval_giou": 0.539726734161377,
+        "eval_ciou": 0.5628448128700256
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 5.0,
+        "eval_giou": 0.5516190528869629,
+        "eval_ciou": 0.5699143409729004
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 6.0,
+        "eval_giou": 0.5535993576049805,
+        "eval_ciou": 0.5486313700675964
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 7.0,
+        "eval_giou": 0.5771014094352722,
+        "eval_ciou": 0.630760908126831
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 8.0,
+        "eval_giou": 0.5713648796081543,
+        "eval_ciou": 0.5902009606361389
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 9.0,
+        "eval_giou": 0.566828727722168,
+        "eval_ciou": 0.5753384232521057
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 10.0,
+        "eval_giou": 0.5662292838096619,
+        "eval_ciou": 0.5734410285949707
+    },
+    {
+        "val_dataset": "ReasonSeg|test",
+        "epoch": 10.0,
+        "eval_giou": 0.5632049441337585,
+        "eval_ciou": 0.5677175521850586
+    },
+    {
+        "val_dataset": "refcoco|unc|val",
+        "epoch": 10.0,
+        "eval_giou": 0.8058294057846069,
+        "eval_ciou": 0.810309886932373
+    },
+    {
+        "val_dataset": "refcoco|unc|testA",
+        "epoch": 10.0,
+        "eval_giou": 0.8246700167655945,
+        "eval_ciou": 0.8328030705451965
+    },
+    {
+        "val_dataset": "refcoco|unc|testB",
+        "epoch": 10.0,
+        "eval_giou": 0.7877973914146423,
+        "eval_ciou": 0.7934398651123047
+    },
+    {
+        "val_dataset": "refcoco+|unc|val",
+        "epoch": 10.0,
+        "eval_giou": 0.7641584277153015,
+        "eval_ciou": 0.7556021809577942
+    },
+    {
+        "val_dataset": "refcoco+|unc|testA",
+        "epoch": 10.0,
+        "eval_giou": 0.7998954057693481,
+        "eval_ciou": 0.7981683611869812
+    },
+    {
+        "val_dataset": "refcoco+|unc|testB",
+        "epoch": 10.0,
+        "eval_giou": 0.7219251394271851,
+        "eval_ciou": 0.7105168104171753
+    },
+    {
+        "val_dataset": "refcocog|umd|test",
+        "epoch": 10.0,
+        "eval_giou": 0.766793966293335,
+        "eval_ciou": 0.7789492011070251
+    },
+    {
+        "val_dataset": "refcocog|umd|val",
+        "epoch": 10.0,
+        "eval_giou": 0.7627427577972412,
+        "eval_ciou": 0.7680707573890686
+    }
+]

lisa-ivl3-2b_bi2cbe_aati_srs/events.out.tfevents.1758407218.bask-pg0308u25a.3988218.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ceb9faddf368f10dc1f79077182ae3f0763d1d459cd00745aefdef29c4785740
+size 212352

lisa-ivl3-2b_bi2cbe_aati_srs/runs/Sep20_23-26-55_bask-pg0308u25a/events.out.tfevents.1758407268.bask-pg0308u25a.3988218.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3c60008ebfd9d19da94c88abc8cbca2ad3850f341e6cd01437d6e2c1a16144b9
+size 116381

lisa-ivl3-2b_bi2cbe_aati_srs/runs/Sep20_23-26-55_bask-pg0308u25a/events.out.tfevents.1758441983.bask-pg0308u25a.3988218.2 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ebda0e4e7c56eda12f89e0b655238dcdd19f18e497ae1d685d308e1e21d0b7dd
+size 1402

lisa-ivl3-2b_bi2cbe_ib_vlorati_sr/ckpt_model/config.json ADDED Viewed

	@@ -0,0 +1,143 @@

+{
+  "architectures": [
+    "InternVL3Self"
+  ],
+  "auto_map": {
+    "AutoConfig": "configuration_internvl_chat.InternVLChatConfig",
+    "AutoModel": "modeling_internvl_chat.InternVLChatModel",
+    "AutoModelForCausalLM": "modeling_internvl_chat.InternVLChatModel"
+  },
+  "downsample_ratio": 0.5,
+  "dtype": "bfloat16",
+  "dynamic_image_size": true,
+  "eos_token_id": 151645,
+  "force_image_size": 448,
+  "hidden_size": 1536,
+  "image_fold": null,
+  "llm_config": {
+    "_attn_implementation_autoset": true,
+    "_name_or_path": "./pretrained/Qwen2.5-32B-Instruct",
+    "architectures": [
+      "Qwen2ForCausalLM"
+    ],
+    "attention_dropout": 0.0,
+    "bos_token_id": 151643,
+    "dtype": "bfloat16",
+    "eos_token_id": 151643,
+    "hidden_act": "silu",
+    "hidden_size": 1536,
+    "initializer_range": 0.02,
+    "intermediate_size": 8960,
+    "layer_types": [
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention"
+    ],
+    "max_position_embeddings": 32768,
+    "max_window_layers": 70,
+    "model_type": "qwen2",
+    "moe_config": null,
+    "num_attention_heads": 12,
+    "num_hidden_layers": 28,
+    "num_key_value_heads": 2,
+    "rms_norm_eps": 1e-06,
+    "rope_scaling": {
+      "factor": 2.0,
+      "rope_type": "dynamic",
+      "type": "dynamic"
+    },
+    "rope_theta": 1000000.0,
+    "sliding_window": null,
+    "use_bfloat16": true,
+    "use_cache": false,
+    "use_sliding_window": false,
+    "vocab_size": 151676
+  },
+  "max_dynamic_patch": 12,
+  "min_dynamic_patch": 1,
+  "model_type": "internvl_chat",
+  "output_attentions": false,
+  "pad2square": false,
+  "pad_token_id": 151643,
+  "ps_version": "v2",
+  "select_layer": -1,
+  "system_message": null,
+  "template": "internvl2_5",
+  "tie_word_embeddings": false,
+  "transformers_version": null,
+  "use_backbone_lora": 0,
+  "use_llm_lora": 0,
+  "use_thumbnail": true,
+  "vision_config": {
+    "_attn_implementation_autoset": true,
+    "_name_or_path": "OpenGVLab/InternViT-6B-448px-V1-5",
+    "architectures": [
+      "InternVisionModel"
+    ],
+    "attention_dropout": 0.0,
+    "auto_map": {
+      "AutoConfig": "configuration_intern_vit.InternVisionConfig",
+      "AutoModel": "modeling_intern_vit.InternVisionModel"
+    },
+    "capacity_factor": 1.2,
+    "drop_path_rate": 0.1,
+    "dropout": 0.0,
+    "dtype": "bfloat16",
+    "eval_capacity_factor": 1.4,
+    "hidden_act": "gelu",
+    "hidden_size": 1024,
+    "image_size": 448,
+    "initializer_factor": 0.1,
+    "initializer_range": 1e-10,
+    "intermediate_size": 4096,
+    "laux_allreduce": "all_nodes",
+    "layer_norm_eps": 1e-06,
+    "model_type": "intern_vit_6b",
+    "moe_coeff_ratio": 0.5,
+    "moe_intermediate_size": 768,
+    "moe_output_scale": 4.0,
+    "noisy_gate_policy": "RSample_before",
+    "norm_type": "layer_norm",
+    "num_attention_heads": 16,
+    "num_channels": 3,
+    "num_experts": 8,
+    "num_hidden_layers": 24,
+    "num_routed_experts": 4,
+    "num_shared_experts": 4,
+    "patch_size": 14,
+    "qk_normalization": false,
+    "qkv_bias": true,
+    "shared_expert_intermediate_size": 3072,
+    "use_bfloat16": true,
+    "use_flash_attn": true,
+    "use_moe": false,
+    "use_residual": true,
+    "use_rts": false,
+    "use_weighted_residual": false
+  }
+}

lisa-ivl3-2b_bi2cbe_ib_vlorati_sr/ckpt_model/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c525c1ae85c17caddcdb1b0d45df96d56a86227e4f990cbb36d7331a692551ad
+size 4211070232

lisa-ivl3-2b_bi2cbe_ib_vlorati_sr/ckpt_model/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7da9ac5d9ad0770700bf7b786cf18482fad5fd08e88a5e860bd99406ca19065d
+size 7352

lisa-ivl3-2b_bi2cbe_ib_vlorati_sr/evaluation_metrics.json ADDED Viewed

	@@ -0,0 +1,116 @@

+[
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 1.0,
+        "eval_giou": 0.4889245629310608,
+        "eval_ciou": 0.5533338189125061
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 2.0,
+        "eval_giou": 0.5513965487480164,
+        "eval_ciou": 0.6630034446716309
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 3.0,
+        "eval_giou": 0.5442399382591248,
+        "eval_ciou": 0.6376377940177917
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 4.0,
+        "eval_giou": 0.5748190879821777,
+        "eval_ciou": 0.6525793671607971
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 5.0,
+        "eval_giou": 0.5847772359848022,
+        "eval_ciou": 0.643996000289917
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 6.0,
+        "eval_giou": 0.5810279846191406,
+        "eval_ciou": 0.6454022526741028
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 7.0,
+        "eval_giou": 0.5949556827545166,
+        "eval_ciou": 0.6094688177108765
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 8.0,
+        "eval_giou": 0.6049715280532837,
+        "eval_ciou": 0.6379661560058594
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 9.0,
+        "eval_giou": 0.6034538149833679,
+        "eval_ciou": 0.6570442914962769
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 10.0,
+        "eval_giou": 0.6016661524772644,
+        "eval_ciou": 0.6353110671043396
+    },
+    {
+        "val_dataset": "ReasonSeg|test",
+        "epoch": 10.0,
+        "eval_giou": 0.6043070554733276,
+        "eval_ciou": 0.608022153377533
+    },
+    {
+        "val_dataset": "refcoco|unc|val",
+        "epoch": 10.0,
+        "eval_giou": 0.7902190089225769,
+        "eval_ciou": 0.7928427457809448
+    },
+    {
+        "val_dataset": "refcoco|unc|testA",
+        "epoch": 10.0,
+        "eval_giou": 0.807979166507721,
+        "eval_ciou": 0.8122658729553223
+    },
+    {
+        "val_dataset": "refcoco|unc|testB",
+        "epoch": 10.0,
+        "eval_giou": 0.763839066028595,
+        "eval_ciou": 0.764618992805481
+    },
+    {
+        "val_dataset": "refcoco+|unc|val",
+        "epoch": 10.0,
+        "eval_giou": 0.738534688949585,
+        "eval_ciou": 0.7319899201393127
+    },
+    {
+        "val_dataset": "refcoco+|unc|testA",
+        "epoch": 10.0,
+        "eval_giou": 0.7776216864585876,
+        "eval_ciou": 0.7770327925682068
+    },
+    {
+        "val_dataset": "refcoco+|unc|testB",
+        "epoch": 10.0,
+        "eval_giou": 0.6900521516799927,
+        "eval_ciou": 0.676867663860321
+    },
+    {
+        "val_dataset": "refcocog|umd|test",
+        "epoch": 10.0,
+        "eval_giou": 0.7514216899871826,
+        "eval_ciou": 0.7589317560195923
+    },
+    {
+        "val_dataset": "refcocog|umd|val",
+        "epoch": 10.0,
+        "eval_giou": 0.7455593943595886,
+        "eval_ciou": 0.7489427924156189
+    }
+]

lisa-ivl3-2b_bi2cbe_ib_vlorati_sr/events.out.tfevents.1758822942.bask-pg0308u25a.3977024.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c5090ab4b5276a748931cd1068f50c6d17618a085656691fb72a03b346bd7b3b
+size 88

lisa-ivl3-2b_bi2cbe_ib_vlorati_sr/events.out.tfevents.1758823030.bask-pg0308u25a.3998347.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4aac91ef4c5538767282625b5123a14924a0f19f313d68d62ed42912194aebe6
+size 212352

lisa-ivl3-2b_bi2cbe_ib_vlorati_sr/runs/Sep25_18-57-07_bask-pg0308u25a/events.out.tfevents.1758823107.bask-pg0308u25a.3998347.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:eb225847cc5dc86b3ecdb0241d649d67245d9ca0710b65086da8f329c5700ee6
+size 116397

lisa-ivl3-2b_bi2cbe_ib_vlorati_sr/runs/Sep25_18-57-07_bask-pg0308u25a/events.out.tfevents.1758870402.bask-pg0308u25a.3998347.2 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0907be6c27349e6b811188c1c28862e763dfde6a47b69586b494273b0268d8f9
+size 1402

lisa-ivl3-2b_bi2cbe_ivs_vlorati_sr/ckpt_model/config.json ADDED Viewed

	@@ -0,0 +1,143 @@

+{
+  "architectures": [
+    "InternVL3Self"
+  ],
+  "auto_map": {
+    "AutoConfig": "configuration_internvl_chat.InternVLChatConfig",
+    "AutoModel": "modeling_internvl_chat.InternVLChatModel",
+    "AutoModelForCausalLM": "modeling_internvl_chat.InternVLChatModel"
+  },
+  "downsample_ratio": 0.5,
+  "dtype": "bfloat16",
+  "dynamic_image_size": true,
+  "eos_token_id": 151645,
+  "force_image_size": 448,
+  "hidden_size": 1536,
+  "image_fold": null,
+  "llm_config": {
+    "_attn_implementation_autoset": true,
+    "_name_or_path": "./pretrained/Qwen2.5-32B-Instruct",
+    "architectures": [
+      "Qwen2ForCausalLM"
+    ],
+    "attention_dropout": 0.0,
+    "bos_token_id": 151643,
+    "dtype": "bfloat16",
+    "eos_token_id": 151643,
+    "hidden_act": "silu",
+    "hidden_size": 1536,
+    "initializer_range": 0.02,
+    "intermediate_size": 8960,
+    "layer_types": [
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention"
+    ],
+    "max_position_embeddings": 32768,
+    "max_window_layers": 70,
+    "model_type": "qwen2",
+    "moe_config": null,
+    "num_attention_heads": 12,
+    "num_hidden_layers": 28,
+    "num_key_value_heads": 2,
+    "rms_norm_eps": 1e-06,
+    "rope_scaling": {
+      "factor": 2.0,
+      "rope_type": "dynamic",
+      "type": "dynamic"
+    },
+    "rope_theta": 1000000.0,
+    "sliding_window": null,
+    "use_bfloat16": true,
+    "use_cache": false,
+    "use_sliding_window": false,
+    "vocab_size": 151676
+  },
+  "max_dynamic_patch": 12,
+  "min_dynamic_patch": 1,
+  "model_type": "internvl_chat",
+  "output_attentions": false,
+  "pad2square": false,
+  "pad_token_id": 151643,
+  "ps_version": "v2",
+  "select_layer": -1,
+  "system_message": null,
+  "template": "internvl2_5",
+  "tie_word_embeddings": false,
+  "transformers_version": null,
+  "use_backbone_lora": 0,
+  "use_llm_lora": 0,
+  "use_thumbnail": true,
+  "vision_config": {
+    "_attn_implementation_autoset": true,
+    "_name_or_path": "OpenGVLab/InternViT-6B-448px-V1-5",
+    "architectures": [
+      "InternVisionModel"
+    ],
+    "attention_dropout": 0.0,
+    "auto_map": {
+      "AutoConfig": "configuration_intern_vit.InternVisionConfig",
+      "AutoModel": "modeling_intern_vit.InternVisionModel"
+    },
+    "capacity_factor": 1.2,
+    "drop_path_rate": 0.1,
+    "dropout": 0.0,
+    "dtype": "bfloat16",
+    "eval_capacity_factor": 1.4,
+    "hidden_act": "gelu",
+    "hidden_size": 1024,
+    "image_size": 448,
+    "initializer_factor": 0.1,
+    "initializer_range": 1e-10,
+    "intermediate_size": 4096,
+    "laux_allreduce": "all_nodes",
+    "layer_norm_eps": 1e-06,
+    "model_type": "intern_vit_6b",
+    "moe_coeff_ratio": 0.5,
+    "moe_intermediate_size": 768,
+    "moe_output_scale": 4.0,
+    "noisy_gate_policy": "RSample_before",
+    "norm_type": "layer_norm",
+    "num_attention_heads": 16,
+    "num_channels": 3,
+    "num_experts": 8,
+    "num_hidden_layers": 24,
+    "num_routed_experts": 4,
+    "num_shared_experts": 4,
+    "patch_size": 14,
+    "qk_normalization": false,
+    "qkv_bias": true,
+    "shared_expert_intermediate_size": 3072,
+    "use_bfloat16": true,
+    "use_flash_attn": true,
+    "use_moe": false,
+    "use_residual": true,
+    "use_rts": false,
+    "use_weighted_residual": false
+  }
+}

lisa-ivl3-2b_bi2cbe_ivs_vlorati_sr/ckpt_model/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a9a73ee98332ed56252ee2690f1a7351446fd80c4253500657c9284e0a0f05fd
+size 4211070232

lisa-ivl3-2b_bi2cbe_ivs_vlorati_sr/ckpt_model/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:833f70825712e685e5ab69b01da135f496f6a901ba5bc7b958a93796e95e8a09
+size 7352

lisa-ivl3-2b_bi2cbe_ivs_vlorati_sr/evaluation_metrics.json ADDED Viewed

	@@ -0,0 +1,116 @@

+[
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 1.0,
+        "eval_giou": 0.5344988107681274,
+        "eval_ciou": 0.5989851355552673
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 2.0,
+        "eval_giou": 0.5579254031181335,
+        "eval_ciou": 0.646024227142334
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 3.0,
+        "eval_giou": 0.5501570701599121,
+        "eval_ciou": 0.6018446683883667
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 4.0,
+        "eval_giou": 0.5774487853050232,
+        "eval_ciou": 0.6542478203773499
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 5.0,
+        "eval_giou": 0.5822131037712097,
+        "eval_ciou": 0.6766245365142822
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 6.0,
+        "eval_giou": 0.5897811055183411,
+        "eval_ciou": 0.6791333556175232
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 7.0,
+        "eval_giou": 0.5887703895568848,
+        "eval_ciou": 0.6910147070884705
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 8.0,
+        "eval_giou": 0.5998998880386353,
+        "eval_ciou": 0.6640490293502808
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 9.0,
+        "eval_giou": 0.5920247435569763,
+        "eval_ciou": 0.6693744659423828
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 10.0,
+        "eval_giou": 0.6001232266426086,
+        "eval_ciou": 0.6858417987823486
+    },
+    {
+        "val_dataset": "ReasonSeg|test",
+        "epoch": 10.0,
+        "eval_giou": 0.5927180051803589,
+        "eval_ciou": 0.6138883233070374
+    },
+    {
+        "val_dataset": "refcoco|unc|val",
+        "epoch": 10.0,
+        "eval_giou": 0.7834749817848206,
+        "eval_ciou": 0.790122926235199
+    },
+    {
+        "val_dataset": "refcoco|unc|testA",
+        "epoch": 10.0,
+        "eval_giou": 0.8022208213806152,
+        "eval_ciou": 0.8086150884628296
+    },
+    {
+        "val_dataset": "refcoco|unc|testB",
+        "epoch": 10.0,
+        "eval_giou": 0.7566637396812439,
+        "eval_ciou": 0.7609479427337646
+    },
+    {
+        "val_dataset": "refcoco+|unc|val",
+        "epoch": 10.0,
+        "eval_giou": 0.7318623065948486,
+        "eval_ciou": 0.7281762361526489
+    },
+    {
+        "val_dataset": "refcoco+|unc|testA",
+        "epoch": 10.0,
+        "eval_giou": 0.7749318480491638,
+        "eval_ciou": 0.7748793363571167
+    },
+    {
+        "val_dataset": "refcoco+|unc|testB",
+        "epoch": 10.0,
+        "eval_giou": 0.682511568069458,
+        "eval_ciou": 0.6719024777412415
+    },
+    {
+        "val_dataset": "refcocog|umd|test",
+        "epoch": 10.0,
+        "eval_giou": 0.743724524974823,
+        "eval_ciou": 0.7526366710662842
+    },
+    {
+        "val_dataset": "refcocog|umd|val",
+        "epoch": 10.0,
+        "eval_giou": 0.7407757043838501,
+        "eval_ciou": 0.7478148341178894
+    }
+]

lisa-ivl3-2b_bi2cbe_ivs_vlorati_sr/events.out.tfevents.1758558655.bask-pg0308u29a.637997.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bb61bef795309a3922462febab004b11ccf980e30eac016b8230fa293a7b7656
+size 212352

lisa-ivl3-2b_bi2cbe_ivs_vlorati_sr/runs/Sep22_17-30-52_bask-pg0308u29a/events.out.tfevents.1758558731.bask-pg0308u29a.637997.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e87c13cd165f21e6038c79b21806f6123c013c42bd45ef063c0e1671b8751dd7
+size 116399

lisa-ivl3-2b_bi2cbe_ivs_vlorati_sr/runs/Sep22_17-30-52_bask-pg0308u29a/events.out.tfevents.1758608704.bask-pg0308u29a.637997.2 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bf83b859f6d1900c3189c78baebb5ee0e6400bc6d00390754f89d38c552dfb86
+size 1402

lisa-ivl3-2b_bi2cbe_tb_vlorati_sr/ckpt_model/config.json ADDED Viewed

	@@ -0,0 +1,143 @@

+{
+  "architectures": [
+    "InternVL3Self"
+  ],
+  "auto_map": {
+    "AutoConfig": "configuration_internvl_chat.InternVLChatConfig",
+    "AutoModel": "modeling_internvl_chat.InternVLChatModel",
+    "AutoModelForCausalLM": "modeling_internvl_chat.InternVLChatModel"
+  },
+  "downsample_ratio": 0.5,
+  "dtype": "bfloat16",
+  "dynamic_image_size": true,
+  "eos_token_id": 151645,
+  "force_image_size": 448,
+  "hidden_size": 1536,
+  "image_fold": null,
+  "llm_config": {
+    "_attn_implementation_autoset": true,
+    "_name_or_path": "./pretrained/Qwen2.5-32B-Instruct",
+    "architectures": [
+      "Qwen2ForCausalLM"
+    ],
+    "attention_dropout": 0.0,
+    "bos_token_id": 151643,
+    "dtype": "bfloat16",
+    "eos_token_id": 151643,
+    "hidden_act": "silu",
+    "hidden_size": 1536,
+    "initializer_range": 0.02,
+    "intermediate_size": 8960,
+    "layer_types": [
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention"
+    ],
+    "max_position_embeddings": 32768,
+    "max_window_layers": 70,
+    "model_type": "qwen2",
+    "moe_config": null,
+    "num_attention_heads": 12,
+    "num_hidden_layers": 28,
+    "num_key_value_heads": 2,
+    "rms_norm_eps": 1e-06,
+    "rope_scaling": {
+      "factor": 2.0,
+      "rope_type": "dynamic",
+      "type": "dynamic"
+    },
+    "rope_theta": 1000000.0,
+    "sliding_window": null,
+    "use_bfloat16": true,
+    "use_cache": false,
+    "use_sliding_window": false,
+    "vocab_size": 151676
+  },
+  "max_dynamic_patch": 12,
+  "min_dynamic_patch": 1,
+  "model_type": "internvl_chat",
+  "output_attentions": false,
+  "pad2square": false,
+  "pad_token_id": 151643,
+  "ps_version": "v2",
+  "select_layer": -1,
+  "system_message": null,
+  "template": "internvl2_5",
+  "tie_word_embeddings": false,
+  "transformers_version": null,
+  "use_backbone_lora": 0,
+  "use_llm_lora": 0,
+  "use_thumbnail": true,
+  "vision_config": {
+    "_attn_implementation_autoset": true,
+    "_name_or_path": "OpenGVLab/InternViT-6B-448px-V1-5",
+    "architectures": [
+      "InternVisionModel"
+    ],
+    "attention_dropout": 0.0,
+    "auto_map": {
+      "AutoConfig": "configuration_intern_vit.InternVisionConfig",
+      "AutoModel": "modeling_intern_vit.InternVisionModel"
+    },
+    "capacity_factor": 1.2,
+    "drop_path_rate": 0.1,
+    "dropout": 0.0,
+    "dtype": "bfloat16",
+    "eval_capacity_factor": 1.4,
+    "hidden_act": "gelu",
+    "hidden_size": 1024,
+    "image_size": 448,
+    "initializer_factor": 0.1,
+    "initializer_range": 1e-10,
+    "intermediate_size": 4096,
+    "laux_allreduce": "all_nodes",
+    "layer_norm_eps": 1e-06,
+    "model_type": "intern_vit_6b",
+    "moe_coeff_ratio": 0.5,
+    "moe_intermediate_size": 768,
+    "moe_output_scale": 4.0,
+    "noisy_gate_policy": "RSample_before",
+    "norm_type": "layer_norm",
+    "num_attention_heads": 16,
+    "num_channels": 3,
+    "num_experts": 8,
+    "num_hidden_layers": 24,
+    "num_routed_experts": 4,
+    "num_shared_experts": 4,
+    "patch_size": 14,
+    "qk_normalization": false,
+    "qkv_bias": true,
+    "shared_expert_intermediate_size": 3072,
+    "use_bfloat16": true,
+    "use_flash_attn": true,
+    "use_moe": false,
+    "use_residual": true,
+    "use_rts": false,
+    "use_weighted_residual": false
+  }
+}

lisa-ivl3-2b_bi2cbe_tb_vlorati_sr/ckpt_model/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ee127087b96ff9811fbd07f160c2648b5879ccbcd7e88fbf1c57578cc6427656
+size 4211070232

lisa-ivl3-2b_bi2cbe_tb_vlorati_sr/ckpt_model/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:faf8b9941672f97b3e8473f3e7078f73367e3fad3a4c4b35b69c5a79104328df
+size 7352

lisa-ivl3-2b_bi2cbe_tb_vlorati_sr/evaluation_metrics.json ADDED Viewed

	@@ -0,0 +1,116 @@

+[
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 1.0,
+        "eval_giou": 0.5294323563575745,
+        "eval_ciou": 0.5168058276176453
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 2.0,
+        "eval_giou": 0.5691018104553223,
+        "eval_ciou": 0.5466322302818298
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 3.0,
+        "eval_giou": 0.5456892848014832,
+        "eval_ciou": 0.6087337732315063
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 4.0,
+        "eval_giou": 0.5649483799934387,
+        "eval_ciou": 0.5830232501029968
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 5.0,
+        "eval_giou": 0.5766127109527588,
+        "eval_ciou": 0.592596709728241
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 6.0,
+        "eval_giou": 0.5876106023788452,
+        "eval_ciou": 0.6196873188018799
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 7.0,
+        "eval_giou": 0.5895294547080994,
+        "eval_ciou": 0.5830597281455994
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 8.0,
+        "eval_giou": 0.5922108888626099,
+        "eval_ciou": 0.5886086225509644
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 9.0,
+        "eval_giou": 0.6001683473587036,
+        "eval_ciou": 0.5857241749763489
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 10.0,
+        "eval_giou": 0.6061425805091858,
+        "eval_ciou": 0.6062945127487183
+    },
+    {
+        "val_dataset": "ReasonSeg|test",
+        "epoch": 10.0,
+        "eval_giou": 0.5916463136672974,
+        "eval_ciou": 0.5962467789649963
+    },
+    {
+        "val_dataset": "refcoco|unc|val",
+        "epoch": 10.0,
+        "eval_giou": 0.7914398908615112,
+        "eval_ciou": 0.7944017052650452
+    },
+    {
+        "val_dataset": "refcoco|unc|testA",
+        "epoch": 10.0,
+        "eval_giou": 0.8115019202232361,
+        "eval_ciou": 0.8148282766342163
+    },
+    {
+        "val_dataset": "refcoco|unc|testB",
+        "epoch": 10.0,
+        "eval_giou": 0.7657762169837952,
+        "eval_ciou": 0.7644218802452087
+    },
+    {
+        "val_dataset": "refcoco+|unc|val",
+        "epoch": 10.0,
+        "eval_giou": 0.7408427000045776,
+        "eval_ciou": 0.7323743104934692
+    },
+    {
+        "val_dataset": "refcoco+|unc|testA",
+        "epoch": 10.0,
+        "eval_giou": 0.7806029319763184,
+        "eval_ciou": 0.7790927886962891
+    },
+    {
+        "val_dataset": "refcoco+|unc|testB",
+        "epoch": 10.0,
+        "eval_giou": 0.6951540112495422,
+        "eval_ciou": 0.683707058429718
+    },
+    {
+        "val_dataset": "refcocog|umd|test",
+        "epoch": 10.0,
+        "eval_giou": 0.7511024475097656,
+        "eval_ciou": 0.7564254403114319
+    },
+    {
+        "val_dataset": "refcocog|umd|val",
+        "epoch": 10.0,
+        "eval_giou": 0.7492029070854187,
+        "eval_ciou": 0.7516255378723145
+    }
+]

lisa-ivl3-2b_bi2cbe_tb_vlorati_sr/events.out.tfevents.1758821654.bask-pg0308u18a.998112.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2f0f6402efa20cb4eb1c3dcaf9815e71b1964b12d1903fcd9a8cfc7ba8fc924f
+size 486

lisa-ivl3-2b_bi2cbe_tb_vlorati_sr/events.out.tfevents.1758821976.bask-pg0308u18a.1004472.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9b21a9269fe7a0131c65a9b63b6caa674fe4f8b73071b6caa68cc19ce4724062
+size 88

lisa-ivl3-2b_bi2cbe_tb_vlorati_sr/events.out.tfevents.1758822179.bask-pg0308u18a.1008370.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:28cd9c79f6c1e5c37360f0ca87b6fa4ff89de989a108bdfeadb937195000c169
+size 212352

lisa-ivl3-2b_bi2cbe_tb_vlorati_sr/runs/Sep25_18-34-12_bask-pg0308u18a/events.out.tfevents.1758821725.bask-pg0308u18a.998112.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cb59ce061f378068b22c6735f8430ed9ace878dcac3b831594603aaa1bb107a1
+size 9338

lisa-ivl3-2b_bi2cbe_tb_vlorati_sr/runs/Sep25_18-39-34_bask-pg0308u18a/events.out.tfevents.1758822035.bask-pg0308u18a.1004472.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f2050a14b591ad7960da8a1c578624e5fcadc630a64886750db14457a302231c
+size 9131

lisa-ivl3-2b_bi2cbe_tb_vlorati_sr/runs/Sep25_18-42-56_bask-pg0308u18a/events.out.tfevents.1758822240.bask-pg0308u18a.1008370.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:dbc263fde5f12193454e49ef64849b95edfdbe9d84d7748d1bda1f0c04506652
+size 116397

lisa-ivl3-2b_bi2cbe_tb_vlorati_sr/runs/Sep25_18-42-56_bask-pg0308u18a/events.out.tfevents.1758869487.bask-pg0308u18a.1008370.2 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9d1915b5faf4072182ed92a81dc1182e464a0d20fc50e6147b785c025d972e0f
+size 1402

lisa-ivl3-2b_bi2cbe_vlorati_coco/ckpt_model/config.json ADDED Viewed

	@@ -0,0 +1,143 @@

+{
+  "architectures": [
+    "InternVL3Self"
+  ],
+  "auto_map": {
+    "AutoConfig": "configuration_internvl_chat.InternVLChatConfig",
+    "AutoModel": "modeling_internvl_chat.InternVLChatModel",
+    "AutoModelForCausalLM": "modeling_internvl_chat.InternVLChatModel"
+  },
+  "downsample_ratio": 0.5,
+  "dtype": "bfloat16",
+  "dynamic_image_size": true,
+  "eos_token_id": 151645,
+  "force_image_size": 448,
+  "hidden_size": 1536,
+  "image_fold": null,
+  "llm_config": {
+    "_attn_implementation_autoset": true,
+    "_name_or_path": "./pretrained/Qwen2.5-32B-Instruct",
+    "architectures": [
+      "Qwen2ForCausalLM"
+    ],
+    "attention_dropout": 0.0,
+    "bos_token_id": 151643,
+    "dtype": "bfloat16",
+    "eos_token_id": 151643,
+    "hidden_act": "silu",
+    "hidden_size": 1536,
+    "initializer_range": 0.02,
+    "intermediate_size": 8960,
+    "layer_types": [
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention"
+    ],
+    "max_position_embeddings": 32768,
+    "max_window_layers": 70,
+    "model_type": "qwen2",
+    "moe_config": null,
+    "num_attention_heads": 12,
+    "num_hidden_layers": 28,
+    "num_key_value_heads": 2,
+    "rms_norm_eps": 1e-06,
+    "rope_scaling": {
+      "factor": 2.0,
+      "rope_type": "dynamic",
+      "type": "dynamic"
+    },
+    "rope_theta": 1000000.0,
+    "sliding_window": null,
+    "use_bfloat16": true,
+    "use_cache": false,
+    "use_sliding_window": false,
+    "vocab_size": 151676
+  },
+  "max_dynamic_patch": 12,
+  "min_dynamic_patch": 1,
+  "model_type": "internvl_chat",
+  "output_attentions": false,
+  "pad2square": false,
+  "pad_token_id": 151643,
+  "ps_version": "v2",
+  "select_layer": -1,
+  "system_message": null,
+  "template": "internvl2_5",
+  "tie_word_embeddings": false,
+  "transformers_version": null,
+  "use_backbone_lora": 0,
+  "use_llm_lora": 0,
+  "use_thumbnail": true,
+  "vision_config": {
+    "_attn_implementation_autoset": true,
+    "_name_or_path": "OpenGVLab/InternViT-6B-448px-V1-5",
+    "architectures": [
+      "InternVisionModel"
+    ],
+    "attention_dropout": 0.0,
+    "auto_map": {
+      "AutoConfig": "configuration_intern_vit.InternVisionConfig",
+      "AutoModel": "modeling_intern_vit.InternVisionModel"
+    },
+    "capacity_factor": 1.2,
+    "drop_path_rate": 0.1,
+    "dropout": 0.0,
+    "dtype": "bfloat16",
+    "eval_capacity_factor": 1.4,
+    "hidden_act": "gelu",
+    "hidden_size": 1024,
+    "image_size": 448,
+    "initializer_factor": 0.1,
+    "initializer_range": 1e-10,
+    "intermediate_size": 4096,
+    "laux_allreduce": "all_nodes",
+    "layer_norm_eps": 1e-06,
+    "model_type": "intern_vit_6b",
+    "moe_coeff_ratio": 0.5,
+    "moe_intermediate_size": 768,
+    "moe_output_scale": 4.0,
+    "noisy_gate_policy": "RSample_before",
+    "norm_type": "layer_norm",
+    "num_attention_heads": 16,
+    "num_channels": 3,
+    "num_experts": 8,
+    "num_hidden_layers": 24,
+    "num_routed_experts": 4,
+    "num_shared_experts": 4,
+    "patch_size": 14,
+    "qk_normalization": false,
+    "qkv_bias": true,
+    "shared_expert_intermediate_size": 3072,
+    "use_bfloat16": true,
+    "use_flash_attn": true,
+    "use_moe": false,
+    "use_residual": true,
+    "use_rts": false,
+    "use_weighted_residual": false
+  }
+}

lisa-ivl3-2b_bi2cbe_vlorati_coco/ckpt_model/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c75bb36d150d76c1aded195dfe0969ac1e5f7b51708e3253890664b3306fe7b6
+size 4211070232

lisa-ivl3-2b_bi2cbe_vlorati_coco/ckpt_model/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:586d01e0f868c297c5556fb5760bb5f53403f37d00934248a1f70708c2bbdc4d
+size 7352

lisa-ivl3-2b_bi2cbe_vlorati_coco/evaluation_metrics.json ADDED Viewed

	@@ -0,0 +1,116 @@

+[
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 1.0,
+        "eval_giou": 0.5369102954864502,
+        "eval_ciou": 0.5064759254455566
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 2.0,
+        "eval_giou": 0.5686467289924622,
+        "eval_ciou": 0.611318051815033
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 3.0,
+        "eval_giou": 0.5613127946853638,
+        "eval_ciou": 0.6206056475639343
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 4.0,
+        "eval_giou": 0.5933331847190857,
+        "eval_ciou": 0.6126891374588013
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 5.0,
+        "eval_giou": 0.6065125465393066,
+        "eval_ciou": 0.6544414162635803
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 6.0,
+        "eval_giou": 0.5995581150054932,
+        "eval_ciou": 0.6379423141479492
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 7.0,
+        "eval_giou": 0.6159911155700684,
+        "eval_ciou": 0.621420681476593
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 8.0,
+        "eval_giou": 0.6243378520011902,
+        "eval_ciou": 0.6523417234420776
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 9.0,
+        "eval_giou": 0.6166976690292358,
+        "eval_ciou": 0.6346321702003479
+    },
+    {
+        "val_dataset": "ReasonSeg|val",
+        "epoch": 10.0,
+        "eval_giou": 0.6171593070030212,
+        "eval_ciou": 0.6407290697097778
+    },
+    {
+        "val_dataset": "ReasonSeg|test",
+        "epoch": 10.0,
+        "eval_giou": 0.5836987495422363,
+        "eval_ciou": 0.6126533150672913
+    },
+    {
+        "val_dataset": "refcoco|unc|val",
+        "epoch": 10.0,
+        "eval_giou": 0.7852296233177185,
+        "eval_ciou": 0.7870670557022095
+    },
+    {
+        "val_dataset": "refcoco|unc|testA",
+        "epoch": 10.0,
+        "eval_giou": 0.8046602010726929,
+        "eval_ciou": 0.8073185086250305
+    },
+    {
+        "val_dataset": "refcoco|unc|testB",
+        "epoch": 10.0,
+        "eval_giou": 0.7577531337738037,
+        "eval_ciou": 0.7593867778778076
+    },
+    {
+        "val_dataset": "refcoco+|unc|val",
+        "epoch": 10.0,
+        "eval_giou": 0.7351171374320984,
+        "eval_ciou": 0.7267892956733704
+    },
+    {
+        "val_dataset": "refcoco+|unc|testA",
+        "epoch": 10.0,
+        "eval_giou": 0.7731851935386658,
+        "eval_ciou": 0.7728055119514465
+    },
+    {
+        "val_dataset": "refcoco+|unc|testB",
+        "epoch": 10.0,
+        "eval_giou": 0.6876177191734314,
+        "eval_ciou": 0.6751795411109924
+    },
+    {
+        "val_dataset": "refcocog|umd|test",
+        "epoch": 10.0,
+        "eval_giou": 0.7494315505027771,
+        "eval_ciou": 0.7570431232452393
+    },
+    {
+        "val_dataset": "refcocog|umd|val",
+        "epoch": 10.0,
+        "eval_giou": 0.7449917197227478,
+        "eval_ciou": 0.750389039516449
+    }
+]

lisa-ivl3-2b_bi2cbe_vlorati_coco/events.out.tfevents.1758236140.bask-pg0309u16a.1220041.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a673a2115871fc802ba01b020cb9f8f61e30b9e9406eedf604c1d500fb25c686
+size 212352

lisa-ivl3-2b_bi2cbe_vlorati_coco/runs/Sep18_23-55-37_bask-pg0309u16a/events.out.tfevents.1758236201.bask-pg0309u16a.1220041.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:04a7180c0676429a3801a6fe71e0ec596fc2cff90bfd8a557828056eb13598e1
+size 116395

lisa-ivl3-2b_bi2cbe_vlorati_coco/runs/Sep18_23-55-37_bask-pg0309u16a/events.out.tfevents.1758283609.bask-pg0309u16a.1220041.2 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ad3a469cb6b9847f58a453fce555b48ae34226582d16eaa962b62daec1fe25d6
+size 1402

lisa-ivl3-2b_bi2cbe_vlorati_sr/ckpt_model/config.json ADDED Viewed

	@@ -0,0 +1,143 @@

+{
+  "architectures": [
+    "InternVL3Self"
+  ],
+  "auto_map": {
+    "AutoConfig": "configuration_internvl_chat.InternVLChatConfig",
+    "AutoModel": "modeling_internvl_chat.InternVLChatModel",
+    "AutoModelForCausalLM": "modeling_internvl_chat.InternVLChatModel"
+  },
+  "downsample_ratio": 0.5,
+  "dtype": "bfloat16",
+  "dynamic_image_size": true,
+  "eos_token_id": 151645,
+  "force_image_size": 448,
+  "hidden_size": 1536,
+  "image_fold": null,
+  "llm_config": {
+    "_attn_implementation_autoset": true,
+    "_name_or_path": "./pretrained/Qwen2.5-32B-Instruct",
+    "architectures": [
+      "Qwen2ForCausalLM"
+    ],
+    "attention_dropout": 0.0,
+    "bos_token_id": 151643,
+    "dtype": "bfloat16",
+    "eos_token_id": 151643,
+    "hidden_act": "silu",
+    "hidden_size": 1536,
+    "initializer_range": 0.02,
+    "intermediate_size": 8960,
+    "layer_types": [
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention"
+    ],
+    "max_position_embeddings": 32768,
+    "max_window_layers": 70,
+    "model_type": "qwen2",
+    "moe_config": null,
+    "num_attention_heads": 12,
+    "num_hidden_layers": 28,
+    "num_key_value_heads": 2,
+    "rms_norm_eps": 1e-06,
+    "rope_scaling": {
+      "factor": 2.0,
+      "rope_type": "dynamic",
+      "type": "dynamic"
+    },
+    "rope_theta": 1000000.0,
+    "sliding_window": null,
+    "use_bfloat16": true,
+    "use_cache": false,
+    "use_sliding_window": false,
+    "vocab_size": 151676
+  },
+  "max_dynamic_patch": 12,
+  "min_dynamic_patch": 1,
+  "model_type": "internvl_chat",
+  "output_attentions": false,
+  "pad2square": false,
+  "pad_token_id": 151643,
+  "ps_version": "v2",
+  "select_layer": -1,
+  "system_message": null,
+  "template": "internvl2_5",
+  "tie_word_embeddings": false,
+  "transformers_version": null,
+  "use_backbone_lora": 0,
+  "use_llm_lora": 0,
+  "use_thumbnail": true,
+  "vision_config": {
+    "_attn_implementation_autoset": true,
+    "_name_or_path": "OpenGVLab/InternViT-6B-448px-V1-5",
+    "architectures": [
+      "InternVisionModel"
+    ],
+    "attention_dropout": 0.0,
+    "auto_map": {
+      "AutoConfig": "configuration_intern_vit.InternVisionConfig",
+      "AutoModel": "modeling_intern_vit.InternVisionModel"
+    },
+    "capacity_factor": 1.2,
+    "drop_path_rate": 0.1,
+    "dropout": 0.0,
+    "dtype": "bfloat16",
+    "eval_capacity_factor": 1.4,
+    "hidden_act": "gelu",
+    "hidden_size": 1024,
+    "image_size": 448,
+    "initializer_factor": 0.1,
+    "initializer_range": 1e-10,
+    "intermediate_size": 4096,
+    "laux_allreduce": "all_nodes",
+    "layer_norm_eps": 1e-06,
+    "model_type": "intern_vit_6b",
+    "moe_coeff_ratio": 0.5,
+    "moe_intermediate_size": 768,
+    "moe_output_scale": 4.0,
+    "noisy_gate_policy": "RSample_before",
+    "norm_type": "layer_norm",
+    "num_attention_heads": 16,
+    "num_channels": 3,
+    "num_experts": 8,
+    "num_hidden_layers": 24,
+    "num_routed_experts": 4,
+    "num_shared_experts": 4,
+    "patch_size": 14,
+    "qk_normalization": false,
+    "qkv_bias": true,
+    "shared_expert_intermediate_size": 3072,
+    "use_bfloat16": true,
+    "use_flash_attn": true,
+    "use_moe": false,
+    "use_residual": true,
+    "use_rts": false,
+    "use_weighted_residual": false
+  }
+}