Upload folder using huggingface_hub

Browse files

Files changed (13) hide show

config.json +7 -7
depth_projector/config.json +1 -1
depth_projector/model.safetensors +1 -1
depth_tower/config.json +1 -1
depth_tower/model.safetensors +1 -1
llm/config.json +1 -1
llm/model.safetensors +1 -1
mm_projector/config.json +1 -1
mm_projector/model.safetensors +1 -1
runs/Jun14_06-32-28_job-9be7e87b-6698-4594-a832-c824906e4803-master-0/events.out.tfevents.1749883238.job-9be7e87b-6698-4594-a832-c824906e4803-master-0 +3 -0
trainer_state.json +0 -0
vision_tower/config.json +1 -1
vision_tower/model.safetensors +1 -1

config.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "Ubit": 100,
   "_attn_implementation_autoset": true,
-  "_name_or_path": "/share/project/zhouenshen/hpfs/code/VILA/runs/train/NVILA-Lite-2B-depth-sft-new_placement+new_simulator-10-nodes/model",
   "architectures": [
     "LlavaLlamaModel"
   ],
@@ -17,7 +17,7 @@
   "depth_projector": "mlp_downsample_3x3_fix",
   "depth_projector_cfg": {
     "_attn_implementation_autoset": false,
-    "_name_or_path": "/share/project/zhouenshen/hpfs/code/VILA/runs/train/NVILA-Lite-2B-depth-sft-new_placement+new_simulator-10-nodes/model/depth_projector",
     "add_cross_attention": false,
     "architectures": [
       "MultimodalProjector"
@@ -85,7 +85,7 @@
   "depth_tower": "/share/project/zhouenshen/hpfs/ckpt/vlm/paligemma-siglip-so400m-patch14-448",
   "depth_tower_cfg": {
     "_attn_implementation_autoset": false,
-    "_name_or_path": "/share/project/zhouenshen/hpfs/code/VILA/runs/train/NVILA-Lite-2B-depth-sft-new_placement+new_simulator-10-nodes/model/depth_tower",
     "add_cross_attention": false,
     "architectures": [
       "SiglipVisionModel"
@@ -185,7 +185,7 @@
   "interpolate_mode": "linear",
   "llm_cfg": {
     "_attn_implementation_autoset": false,
-    "_name_or_path": "/share/project/zhouenshen/hpfs/code/VILA/runs/train/NVILA-Lite-2B-depth-sft-new_placement+new_simulator-10-nodes/model/llm",
     "add_cross_attention": false,
     "architectures": [
       "Qwen2ForCausalLM"
@@ -278,7 +278,7 @@
   "mm_projector": "mlp_downsample_3x3_fix",
   "mm_projector_cfg": {
     "_attn_implementation_autoset": false,
-    "_name_or_path": "/share/project/zhouenshen/hpfs/code/VILA/runs/train/NVILA-Lite-2B-depth-sft-new_placement+new_simulator-10-nodes/model/mm_projector",
     "add_cross_attention": false,
     "architectures": [
       "MultimodalProjector"
@@ -366,7 +366,7 @@
   "refine_mlp_blocksize": false,
   "refine_residual_fp": false,
   "refine_row_blocksize": 4,
-  "resume_path": "/share/project/zhouenshen/hpfs/code/VILA/runs/train/NVILA-Lite-2B-depth-sft-new_placement+new_simulator-10-nodes/model",
   "row_blocksize": -1,
   "row_blocksize_optimizer": 1,
   "s2": false,
@@ -395,7 +395,7 @@
   "vision_tower": "/share/project/zhouenshen/hpfs/ckpt/vlm/paligemma-siglip-so400m-patch14-448",
   "vision_tower_cfg": {
     "_attn_implementation_autoset": false,
-    "_name_or_path": "/share/project/zhouenshen/hpfs/code/VILA/runs/train/NVILA-Lite-2B-depth-sft-new_placement+new_simulator-10-nodes/model/vision_tower",
     "add_cross_attention": false,
     "architectures": [
       "SiglipVisionModel"

 {
   "Ubit": 100,
   "_attn_implementation_autoset": true,
+  "_name_or_path": "/share/project/zhouenshen/hpfs/code/VILA/runs/train/NVILA-Lite-2B-depth-sft-new_placement+new_simulator/model",
   "architectures": [
     "LlavaLlamaModel"
   ],
   "depth_projector": "mlp_downsample_3x3_fix",
   "depth_projector_cfg": {
     "_attn_implementation_autoset": false,
+    "_name_or_path": "/share/project/zhouenshen/hpfs/code/VILA/runs/train/NVILA-Lite-2B-depth-sft-new_placement+new_simulator/model/depth_projector",
     "add_cross_attention": false,
     "architectures": [
       "MultimodalProjector"
   "depth_tower": "/share/project/zhouenshen/hpfs/ckpt/vlm/paligemma-siglip-so400m-patch14-448",
   "depth_tower_cfg": {
     "_attn_implementation_autoset": false,
+    "_name_or_path": "/share/project/zhouenshen/hpfs/code/VILA/runs/train/NVILA-Lite-2B-depth-sft-new_placement+new_simulator/model/depth_tower",
     "add_cross_attention": false,
     "architectures": [
       "SiglipVisionModel"
   "interpolate_mode": "linear",
   "llm_cfg": {
     "_attn_implementation_autoset": false,
+    "_name_or_path": "/share/project/zhouenshen/hpfs/code/VILA/runs/train/NVILA-Lite-2B-depth-sft-new_placement+new_simulator/model/llm",
     "add_cross_attention": false,
     "architectures": [
       "Qwen2ForCausalLM"
   "mm_projector": "mlp_downsample_3x3_fix",
   "mm_projector_cfg": {
     "_attn_implementation_autoset": false,
+    "_name_or_path": "/share/project/zhouenshen/hpfs/code/VILA/runs/train/NVILA-Lite-2B-depth-sft-new_placement+new_simulator/model/mm_projector",
     "add_cross_attention": false,
     "architectures": [
       "MultimodalProjector"
   "refine_mlp_blocksize": false,
   "refine_residual_fp": false,
   "refine_row_blocksize": 4,
+  "resume_path": "/share/project/zhouenshen/hpfs/code/VILA/runs/train/NVILA-Lite-2B-depth-sft-new_placement+new_simulator/model",
   "row_blocksize": -1,
   "row_blocksize_optimizer": 1,
   "s2": false,
   "vision_tower": "/share/project/zhouenshen/hpfs/ckpt/vlm/paligemma-siglip-so400m-patch14-448",
   "vision_tower_cfg": {
     "_attn_implementation_autoset": false,
+    "_name_or_path": "/share/project/zhouenshen/hpfs/code/VILA/runs/train/NVILA-Lite-2B-depth-sft-new_placement+new_simulator/model/vision_tower",
     "add_cross_attention": false,
     "architectures": [
       "SiglipVisionModel"

depth_projector/config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "/share/project/zhouenshen/hpfs/code/VILA/runs/train/NVILA-Lite-2B-depth-sft-new_placement+new_simulator-10-nodes/model/depth_projector",
   "architectures": [
     "MultimodalProjector"
   ],

 {
+  "_name_or_path": "/share/project/zhouenshen/hpfs/code/VILA/runs/train/NVILA-Lite-2B-depth-sft-new_placement+new_simulator/model/depth_projector",
   "architectures": [
     "MultimodalProjector"
   ],

depth_projector/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:04d8d30f7ada9c8912a155a8e3286b4be9f356d57402783d5257cd098a3a0075
 size 87068272

 version https://git-lfs.github.com/spec/v1
+oid sha256:077b99b727dfd07aaf60280baaad16be7560c71c05f0811b58bd5b593aca73d3
 size 87068272

depth_tower/config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "/share/project/zhouenshen/hpfs/code/VILA/runs/train/NVILA-Lite-2B-depth-sft-new_placement+new_simulator-10-nodes/model/depth_tower",
   "architectures": [
     "SiglipVisionModel"
   ],

 {
+  "_name_or_path": "/share/project/zhouenshen/hpfs/code/VILA/runs/train/NVILA-Lite-2B-depth-sft-new_placement+new_simulator/model/depth_tower",
   "architectures": [
     "SiglipVisionModel"
   ],

depth_tower/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8ab0cdbfe8518b7af42d78413b5f41250492b4da2532020e63e76896d16f3565
 size 826707904

 version https://git-lfs.github.com/spec/v1
+oid sha256:640aecc60714538d98ecc6ab817454446075b11c86915d836d0e50e7d5cff6a2
 size 826707904

llm/config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "/share/project/zhouenshen/hpfs/code/VILA/runs/train/NVILA-Lite-2B-depth-sft-new_placement+new_simulator-10-nodes/model/llm",
   "architectures": [
     "Qwen2ForCausalLM"
   ],

 {
+  "_name_or_path": "/share/project/zhouenshen/hpfs/code/VILA/runs/train/NVILA-Lite-2B-depth-sft-new_placement+new_simulator/model/llm",
   "architectures": [
     "Qwen2ForCausalLM"
   ],

llm/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b93b78db7e60f4afe47dfede4f31cb3c4c5df5a10a29a7957a8c1172a96011be
 size 3086594696

 version https://git-lfs.github.com/spec/v1
+oid sha256:0bfb140450d88d5698d7af3ae8c87af7d7d356fdefe94d66a5ff5b319218071d
 size 3086594696

mm_projector/config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "/share/project/zhouenshen/hpfs/code/VILA/runs/train/NVILA-Lite-2B-depth-sft-new_placement+new_simulator-10-nodes/model/mm_projector",
   "architectures": [
     "MultimodalProjector"
   ],

 {
+  "_name_or_path": "/share/project/zhouenshen/hpfs/code/VILA/runs/train/NVILA-Lite-2B-depth-sft-new_placement+new_simulator/model/mm_projector",
   "architectures": [
     "MultimodalProjector"
   ],

mm_projector/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:02752ffd6a4c1d45ca48cfed496f019f43311d09be43f5f1c944eae15e363e3e
 size 87068272

 version https://git-lfs.github.com/spec/v1
+oid sha256:0c84546f1ff8591f43cc2862dd80837d90c83e2c4f2e9cce9f5f951793433f13
 size 87068272

runs/Jun14_06-32-28_job-9be7e87b-6698-4594-a832-c824906e4803-master-0/events.out.tfevents.1749883238.job-9be7e87b-6698-4594-a832-c824906e4803-master-0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c41e42347a0db68c8f9b4a94eabb475bfcbde2b18e864eaf47d46c0f41755ab9
+size 4633872

trainer_state.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

vision_tower/config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "/share/project/zhouenshen/hpfs/code/VILA/runs/train/NVILA-Lite-2B-depth-sft-new_placement+new_simulator-10-nodes/model/vision_tower",
   "architectures": [
     "SiglipVisionModel"
   ],

 {
+  "_name_or_path": "/share/project/zhouenshen/hpfs/code/VILA/runs/train/NVILA-Lite-2B-depth-sft-new_placement+new_simulator/model/vision_tower",
   "architectures": [
     "SiglipVisionModel"
   ],

vision_tower/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9ed468183a3f5823cce92e3362c4a3b9e18de39cfec67bc573dfca6bd82df82c
 size 826707904

 version https://git-lfs.github.com/spec/v1
+oid sha256:86c782eccce96224a8e0402a3676bb1dbc3d77b279b3c5392b96e99fe008443d
 size 826707904