Upload model

Browse files

Files changed (3) hide show

README.md +199 -0
config.json +643 -0
model.safetensors +3 -0

README.md ADDED Viewed

	@@ -0,0 +1,199 @@

+---
+library_name: transformers
+tags: []
+---
+# Model Card for Model ID
+<!-- Provide a quick summary of what the model is/does. -->
+## Model Details
+### Model Description
+<!-- Provide a longer summary of what this model is. -->
+This is the model card of a 🤗 transformers model that has been pushed on the Hub. This model card has been automatically generated.
+- **Developed by:** [More Information Needed]
+- **Funded by [optional]:** [More Information Needed]
+- **Shared by [optional]:** [More Information Needed]
+- **Model type:** [More Information Needed]
+- **Language(s) (NLP):** [More Information Needed]
+- **License:** [More Information Needed]
+- **Finetuned from model [optional]:** [More Information Needed]
+### Model Sources [optional]
+<!-- Provide the basic links for the model. -->
+- **Repository:** [More Information Needed]
+- **Paper [optional]:** [More Information Needed]
+- **Demo [optional]:** [More Information Needed]
+## Uses
+<!-- Address questions around how the model is intended to be used, including the foreseeable users of the model and those affected by the model. -->
+### Direct Use
+<!-- This section is for the model use without fine-tuning or plugging into a larger ecosystem/app. -->
+[More Information Needed]
+### Downstream Use [optional]
+<!-- This section is for the model use when fine-tuned for a task, or when plugged into a larger ecosystem/app -->
+[More Information Needed]
+### Out-of-Scope Use
+<!-- This section addresses misuse, malicious use, and uses that the model will not work well for. -->
+[More Information Needed]
+## Bias, Risks, and Limitations
+<!-- This section is meant to convey both technical and sociotechnical limitations. -->
+[More Information Needed]
+### Recommendations
+<!-- This section is meant to convey recommendations with respect to the bias, risk, and technical limitations. -->
+Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations.
+## How to Get Started with the Model
+Use the code below to get started with the model.
+[More Information Needed]
+## Training Details
+### Training Data
+<!-- This should link to a Dataset Card, perhaps with a short stub of information on what the training data is all about as well as documentation related to data pre-processing or additional filtering. -->
+[More Information Needed]
+### Training Procedure
+<!-- This relates heavily to the Technical Specifications. Content here should link to that section when it is relevant to the training procedure. -->
+#### Preprocessing [optional]
+[More Information Needed]
+#### Training Hyperparameters
+- **Training regime:** [More Information Needed] <!--fp32, fp16 mixed precision, bf16 mixed precision, bf16 non-mixed precision, fp16 non-mixed precision, fp8 mixed precision -->
+#### Speeds, Sizes, Times [optional]
+<!-- This section provides information about throughput, start/end time, checkpoint size if relevant, etc. -->
+[More Information Needed]
+## Evaluation
+<!-- This section describes the evaluation protocols and provides the results. -->
+### Testing Data, Factors & Metrics
+#### Testing Data
+<!-- This should link to a Dataset Card if possible. -->
+[More Information Needed]
+#### Factors
+<!-- These are the things the evaluation is disaggregating by, e.g., subpopulations or domains. -->
+[More Information Needed]
+#### Metrics
+<!-- These are the evaluation metrics being used, ideally with a description of why. -->
+[More Information Needed]
+### Results
+[More Information Needed]
+#### Summary
+## Model Examination [optional]
+<!-- Relevant interpretability work for the model goes here -->
+[More Information Needed]
+## Environmental Impact
+<!-- Total emissions (in grams of CO2eq) and additional considerations, such as electricity usage, go here. Edit the suggested text below accordingly -->
+Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700).
+- **Hardware Type:** [More Information Needed]
+- **Hours used:** [More Information Needed]
+- **Cloud Provider:** [More Information Needed]
+- **Compute Region:** [More Information Needed]
+- **Carbon Emitted:** [More Information Needed]
+## Technical Specifications [optional]
+### Model Architecture and Objective
+[More Information Needed]
+### Compute Infrastructure
+[More Information Needed]
+#### Hardware
+[More Information Needed]
+#### Software
+[More Information Needed]
+## Citation [optional]
+<!-- If there is a paper or blog post introducing the model, the APA and Bibtex information for that should go in this section. -->
+**BibTeX:**
+[More Information Needed]
+**APA:**
+[More Information Needed]
+## Glossary [optional]
+<!-- If relevant, include terms and calculations in this section that can help readers understand the model or model card. -->
+[More Information Needed]
+## More Information [optional]
+[More Information Needed]
+## Model Card Authors [optional]
+[More Information Needed]
+## Model Card Contact
+[More Information Needed]

config.json ADDED Viewed

	@@ -0,0 +1,643 @@

+{
+  "architectures": [
+    "X3DModel"
+  ],
+  "cfg": {
+    "AUG": {
+      "AA_TYPE": "rand-m9-mstd0.5-inc1",
+      "COLOR_JITTER": 0.4,
+      "ENABLE": false,
+      "GEN_MASK_LOADER": false,
+      "INTERPOLATION": "bicubic",
+      "MASK_FRAMES": false,
+      "MASK_RATIO": 0.0,
+      "MASK_TUBE": false,
+      "MASK_WINDOW_SIZE": [
+        8,
+        7,
+        7
+      ],
+      "MAX_MASK_PATCHES_PER_BLOCK": null,
+      "NUM_SAMPLE": 1,
+      "RE_COUNT": 1,
+      "RE_MODE": "pixel",
+      "RE_PROB": 0.25,
+      "RE_SPLIT": false
+    },
+    "AVA": {
+      "ANNOTATION_DIR": "/mnt/vol/gfsai-flash3-east/ai-group/users/haoqifan/ava/frame_list/",
+      "BGR": false,
+      "DETECTION_SCORE_THRESH": 0.9,
+      "EXCLUSION_FILE": "ava_val_excluded_timestamps_v2.2.csv",
+      "FRAME_DIR": "/mnt/fair-flash3-east/ava_trainval_frames.img/",
+      "FRAME_LIST_DIR": "/mnt/vol/gfsai-flash3-east/ai-group/users/haoqifan/ava/frame_list/",
+      "FULL_TEST_ON_VAL": false,
+      "GROUNDTRUTH_FILE": "ava_val_v2.2.csv",
+      "IMG_PROC_BACKEND": "cv2",
+      "LABEL_MAP_FILE": "ava_action_list_v2.2_for_activitynet_2019.pbtxt",
+      "TEST_FORCE_FLIP": false,
+      "TEST_LISTS": [
+        "val.csv"
+      ],
+      "TEST_PREDICT_BOX_LISTS": [
+        "ava_val_predicted_boxes.csv"
+      ],
+      "TRAIN_GT_BOX_LISTS": [
+        "ava_train_v2.2.csv"
+      ],
+      "TRAIN_LISTS": [
+        "train.csv"
+      ],
+      "TRAIN_PCA_JITTER_ONLY": true,
+      "TRAIN_PREDICT_BOX_LISTS": [],
+      "TRAIN_USE_COLOR_AUGMENTATION": false
+    },
+    "BENCHMARK": {
+      "LOG_PERIOD": 100,
+      "NUM_EPOCHS": 5,
+      "SHUFFLE": true
+    },
+    "BN": {
+      "GLOBAL_SYNC": false,
+      "NORM_TYPE": "sync_batchnorm",
+      "NUM_BATCHES_PRECISE": 200,
+      "NUM_SPLITS": 1,
+      "NUM_SYNC_DEVICES": 1,
+      "USE_PRECISE_STATS": true,
+      "WEIGHT_DECAY": 0.0
+    },
+    "CONTRASTIVE": {
+      "BN_MLP": false,
+      "BN_SYNC_MLP": false,
+      "DELTA_CLIPS_MAX": Infinity,
+      "DELTA_CLIPS_MIN": -Infinity,
+      "DIM": 128,
+      "INTERP_MEMORY": false,
+      "KNN_ON": true,
+      "LENGTH": 239975,
+      "LOCAL_SHUFFLE_BN": true,
+      "MEM_TYPE": "1d",
+      "MLP_DIM": 2048,
+      "MOCO_MULTI_VIEW_QUEUE": false,
+      "MOMENTUM": 0.5,
+      "MOMENTUM_ANNEALING": false,
+      "NUM_CLASSES_DOWNSTREAM": 400,
+      "NUM_MLP_LAYERS": 1,
+      "PREDICTOR_DEPTHS": [],
+      "QUEUE_LEN": 65536,
+      "SEQUENTIAL": false,
+      "SIMCLR_DIST_ON": true,
+      "SWAV_QEUE_LEN": 0,
+      "T": 0.07,
+      "TYPE": "mem"
+    },
+    "DATA": {
+      "COLOR_RND_GRAYSCALE": 0.0,
+      "DECODING_BACKEND": "torchvision",
+      "DECODING_SHORT_SIZE": 256,
+      "DUMMY_LOAD": false,
+      "ENSEMBLE_METHOD": "max",
+      "IN22K_TRAINVAL": false,
+      "IN22k_VAL_IN1K": "",
+      "INPUT_CHANNEL_NUM": [
+        3
+      ],
+      "INV_UNIFORM_SAMPLE": true,
+      "IN_VAL_CROP_RATIO": 0.875,
+      "LOADER_CHUNK_OVERALL_SIZE": 0,
+      "LOADER_CHUNK_SIZE": 0,
+      "MEAN": [
+        0.45,
+        0.45,
+        0.45
+      ],
+      "MULTI_LABEL": true,
+      "NUM_FRAMES": 16,
+      "PATH_LABEL_SEPARATOR": " ",
+      "PATH_PREFIX": "kabr/KABR/dataset/image",
+      "PATH_TO_DATA_DIR": "kabr/KABR/annotation",
+      "PATH_TO_PRELOAD_IMDB": "",
+      "RANDOM_FLIP": true,
+      "REVERSE_INPUT_CHANNEL": true,
+      "SAMPLING_RATE": 5,
+      "SKIP_ROWS": 0,
+      "SSL_BLUR_SIGMA_MAX": [
+        0.0,
+        2.0
+      ],
+      "SSL_BLUR_SIGMA_MIN": [
+        0.0,
+        0.1
+      ],
+      "SSL_COLOR_BRI_CON_SAT": [
+        0.2,
+        0.2,
+        0.2
+      ],
+      "SSL_COLOR_HUE": 0.1,
+      "SSL_COLOR_JITTER": true,
+      "SSL_MOCOV2_AUG": false,
+      "STD": [
+        0.225,
+        0.225,
+        0.225
+      ],
+      "TARGET_FPS": 30,
+      "TEST_CROP_SIZE": 300,
+      "TIME_DIFF_PROB": 0.0,
+      "TRAIN_CROP_NUM_SPATIAL": 1,
+      "TRAIN_CROP_NUM_TEMPORAL": 1,
+      "TRAIN_CROP_SIZE": 300,
+      "TRAIN_JITTER_ASPECT_RELATIVE": [],
+      "TRAIN_JITTER_FPS": 0.0,
+      "TRAIN_JITTER_MOTION_SHIFT": false,
+      "TRAIN_JITTER_SCALES": [
+        300,
+        400
+      ],
+      "TRAIN_JITTER_SCALES_RELATIVE": [],
+      "TRAIN_PCA_EIGVAL": [
+        0.225,
+        0.224,
+        0.229
+      ],
+      "TRAIN_PCA_EIGVEC": [
+        [
+          -0.5675,
+          0.7192,
+          0.4009
+        ],
+        [
+          -0.5808,
+          -0.0045,
+          -0.814
+        ],
+        [
+          -0.5836,
+          -0.6948,
+          0.4203
+        ]
+      ],
+      "USE_OFFSET_SAMPLING": false
+    },
+    "DATA_LOADER": {
+      "ENABLE_MULTI_THREAD_DECODE": false,
+      "NUM_WORKERS": 8,
+      "PIN_MEMORY": true
+    },
+    "DEMO": {
+      "BUFFER_SIZE": 0,
+      "CLIP_VIS_SIZE": 10,
+      "COMMON_CLASS_NAMES": [
+        "watch (a person)",
+        "talk to (e.g., self, a person, a group)",
+        "listen to (a person)",
+        "touch (an object)",
+        "carry/hold (an object)",
+        "walk",
+        "sit",
+        "lie/sleep",
+        "bend/bow (at the waist)"
+      ],
+      "COMMON_CLASS_THRES": 0.7,
+      "DETECTRON2_CFG": "COCO-Detection/faster_rcnn_R_50_FPN_3x.yaml",
+      "DETECTRON2_THRESH": 0.9,
+      "DETECTRON2_WEIGHTS": "detectron2://COCO-Detection/faster_rcnn_R_50_FPN_3x/137849458/model_final_280758.pkl",
+      "DISPLAY_HEIGHT": 0,
+      "DISPLAY_WIDTH": 0,
+      "ENABLE": false,
+      "FPS": 30,
+      "GT_BOXES": "",
+      "INPUT_FORMAT": "BGR",
+      "INPUT_VIDEO": "kabr/KABR/dataset/video/G0103.mp4",
+      "LABEL_FILE_PATH": "kabr/KABR/annotation/classes.json",
+      "NUM_CLIPS_SKIP": 1,
+      "NUM_VIS_INSTANCES": 1,
+      "OUTPUT_FILE": "kabr/KABR/dataset/predict/G0103.mp4",
+      "OUTPUT_FPS": -1,
+      "PREDS_BOXES": "",
+      "SLOWMO": 1,
+      "STARTING_SECOND": 900,
+      "THREAD_ENABLE": false,
+      "UNCOMMON_CLASS_THRES": 0.3,
+      "VIS_MODE": "thres",
+      "WEBCAM": -1
+    },
+    "DETECTION": {
+      "ALIGNED": true,
+      "ENABLE": false,
+      "ROI_XFORM_RESOLUTION": 7,
+      "SPATIAL_SCALE_FACTOR": 16
+    },
+    "DIST_BACKEND": "nccl",
+    "LOG_MODEL_INFO": true,
+    "LOG_PERIOD": 10,
+    "MASK": {
+      "DECODER_DEPTH": 0,
+      "DECODER_EMBED_DIM": 512,
+      "DECODER_SEP_POS_EMBED": false,
+      "DEC_KV_KERNEL": [],
+      "DEC_KV_STRIDE": [],
+      "ENABLE": false,
+      "HEAD_TYPE": "separate",
+      "MAE_ON": false,
+      "MAE_RND_MASK": false,
+      "NORM_PRED_PIXEL": true,
+      "PER_FRAME_MASKING": false,
+      "PRED_HOG": false,
+      "PRETRAIN_DEPTH": [
+        15
+      ],
+      "SCALE_INIT_BY_DEPTH": false,
+      "TIME_STRIDE_LOSS": true
+    },
+    "MIXUP": {
+      "ALPHA": 0.8,
+      "CUTMIX_ALPHA": 1.0,
+      "ENABLE": false,
+      "LABEL_SMOOTH_VALUE": 0.1,
+      "PROB": 1.0,
+      "SWITCH_PROB": 0.5
+    },
+    "MODEL": {
+      "ACT_CHECKPOINT": false,
+      "ARCH": "x3d",
+      "DETACH_FINAL_FC": false,
+      "DROPCONNECT_RATE": 0.0,
+      "DROPOUT_RATE": 0.5,
+      "FC_INIT_STD": 0.01,
+      "FP16_ALLREDUCE": false,
+      "FROZEN_BN": false,
+      "HEAD_ACT": "sigmoid",
+      "LOSS_FUNC": "EQL",
+      "MODEL_NAME": "X3D",
+      "MULTI_PATHWAY_ARCH": [
+        "slowfast"
+      ],
+      "NUM_CLASSES": 8,
+      "SINGLE_PATHWAY_ARCH": [
+        "2d",
+        "c2d",
+        "i3d",
+        "slow",
+        "x3d",
+        "mvit",
+        "maskmvit"
+      ]
+    },
+    "MULTIGRID": {
+      "BN_BASE_SIZE": 8,
+      "DEFAULT_B": 0,
+      "DEFAULT_S": 0,
+      "DEFAULT_T": 0,
+      "EPOCH_FACTOR": 1.5,
+      "EVAL_FREQ": 3,
+      "LONG_CYCLE": false,
+      "LONG_CYCLE_FACTORS": [
+        [
+          0.25,
+          0.7071067811865476
+        ],
+        [
+          0.5,
+          0.7071067811865476
+        ],
+        [
+          0.5,
+          1
+        ],
+        [
+          1,
+          1
+        ]
+      ],
+      "LONG_CYCLE_SAMPLING_RATE": 0,
+      "SHORT_CYCLE": false,
+      "SHORT_CYCLE_FACTORS": [
+        0.5,
+        0.7071067811865476
+      ]
+    },
+    "MVIT": {
+      "CLS_EMBED_ON": true,
+      "DEPTH": 16,
+      "DIM_MUL": [],
+      "DIM_MUL_IN_ATT": false,
+      "DROPOUT_RATE": 0.0,
+      "DROPPATH_RATE": 0.1,
+      "EMBED_DIM": 96,
+      "HEAD_INIT_SCALE": 1.0,
+      "HEAD_MUL": [],
+      "LAYER_SCALE_INIT_VALUE": 0.0,
+      "MLP_RATIO": 4.0,
+      "MODE": "conv",
+      "NORM": "layernorm",
+      "NORM_STEM": false,
+      "NUM_HEADS": 1,
+      "PATCH_2D": false,
+      "PATCH_KERNEL": [
+        3,
+        7,
+        7
+      ],
+      "PATCH_PADDING": [
+        2,
+        4,
+        4
+      ],
+      "PATCH_STRIDE": [
+        2,
+        4,
+        4
+      ],
+      "POOL_FIRST": false,
+      "POOL_KVQ_KERNEL": null,
+      "POOL_KV_STRIDE": [],
+      "POOL_KV_STRIDE_ADAPTIVE": null,
+      "POOL_Q_STRIDE": [],
+      "QKV_BIAS": true,
+      "REL_POS_SPATIAL": false,
+      "REL_POS_TEMPORAL": false,
+      "REL_POS_ZERO_INIT": false,
+      "RESIDUAL_POOLING": false,
+      "REV": {
+        "BUFFER_LAYERS": [],
+        "ENABLE": false,
+        "PRE_Q_FUSION": "avg",
+        "RESPATH_FUSE": "concat",
+        "RES_PATH": "conv"
+      },
+      "SEPARATE_QKV": false,
+      "SEP_POS_EMBED": false,
+      "USE_ABS_POS": true,
+      "USE_FIXED_SINCOS_POS": false,
+      "USE_MEAN_POOLING": false,
+      "ZERO_DECAY_POS_CLS": true
+    },
+    "NONLOCAL": {
+      "GROUP": [
+        [
+          1
+        ],
+        [
+          1
+        ],
+        [
+          1
+        ],
+        [
+          1
+        ]
+      ],
+      "INSTANTIATION": "dot_product",
+      "LOCATION": [
+        [
+          []
+        ],
+        [
+          []
+        ],
+        [
+          []
+        ],
+        [
+          []
+        ]
+      ],
+      "POOL": [
+        [
+          [
+            1,
+            2,
+            2
+          ],
+          [
+            1,
+            2,
+            2
+          ]
+        ],
+        [
+          [
+            1,
+            2,
+            2
+          ],
+          [
+            1,
+            2,
+            2
+          ]
+        ],
+        [
+          [
+            1,
+            2,
+            2
+          ],
+          [
+            1,
+            2,
+            2
+          ]
+        ],
+        [
+          [
+            1,
+            2,
+            2
+          ],
+          [
+            1,
+            2,
+            2
+          ]
+        ]
+      ]
+    },
+    "NUM_GPUS": 0,
+    "NUM_SHARDS": 1,
+    "OUTPUT_DIR": "kabr/KABR/logs/x3d-l-kabr",
+    "RESNET": {
+      "DEPTH": 50,
+      "INPLACE_RELU": true,
+      "NUM_BLOCK_TEMP_KERNEL": [
+        [
+          3
+        ],
+        [
+          4
+        ],
+        [
+          6
+        ],
+        [
+          3
+        ]
+      ],
+      "NUM_GROUPS": 1,
+      "SPATIAL_DILATIONS": [
+        [
+          1
+        ],
+        [
+          1
+        ],
+        [
+          1
+        ],
+        [
+          1
+        ]
+      ],
+      "SPATIAL_STRIDES": [
+        [
+          1
+        ],
+        [
+          2
+        ],
+        [
+          2
+        ],
+        [
+          2
+        ]
+      ],
+      "STRIDE_1X1": false,
+      "TRANS_FUNC": "x3d_transform",
+      "WIDTH_PER_GROUP": 64,
+      "ZERO_INIT_FINAL_BN": true,
+      "ZERO_INIT_FINAL_CONV": false
+    },
+    "RNG_SEED": 0,
+    "SHARD_ID": 0,
+    "SLOWFAST": {
+      "ALPHA": 8,
+      "BETA_INV": 8,
+      "FUSION_CONV_CHANNEL_RATIO": 2,
+      "FUSION_KERNEL_SZ": 5
+    },
+    "SOLVER": {
+      "BASE_LR": 0.05,
+      "BASE_LR_SCALE_NUM_SHARDS": true,
+      "BETAS": [
+        0.9,
+        0.999
+      ],
+      "CLIP_GRAD_L2NORM": null,
+      "CLIP_GRAD_VAL": null,
+      "COSINE_AFTER_WARMUP": false,
+      "COSINE_END_LR": 0.0,
+      "DAMPENING": 0.0,
+      "GAMMA": 0.1,
+      "LARS_ON": false,
+      "LAYER_DECAY": 1.0,
+      "LRS": [],
+      "LR_POLICY": "cosine",
+      "MAX_EPOCH": 120,
+      "MOMENTUM": 0.9,
+      "NESTEROV": true,
+      "OPTIMIZING_METHOD": "sgd",
+      "STEPS": [],
+      "STEP_SIZE": 1,
+      "WARMUP_EPOCHS": 35.0,
+      "WARMUP_FACTOR": 0.1,
+      "WARMUP_START_LR": 0.01,
+      "WEIGHT_DECAY": 5e-05,
+      "ZERO_WD_1D_PARAM": false
+    },
+    "TASK": "",
+    "TENSORBOARD": {
+      "CATEGORIES_PATH": "",
+      "CLASS_NAMES_PATH": "kabr/KABR/annotation/classes.json",
+      "CONFUSION_MATRIX": {
+        "ENABLE": true,
+        "FIGSIZE": [
+          8,
+          8
+        ],
+        "SUBSET_PATH": "kabr/KABR/annotation/classes.txt"
+      },
+      "ENABLE": true,
+      "HISTOGRAM": {
+        "ENABLE": true,
+        "FIGSIZE": [
+          8,
+          8
+        ],
+        "SUBSET_PATH": "kabr/KABR/annotation/classes.txt",
+        "TOPK": 3
+      },
+      "LOG_DIR": "",
+      "MODEL_VIS": {
+        "ACTIVATIONS": true,
+        "COLORMAP": "Pastel2",
+        "ENABLE": true,
+        "GRAD_CAM": {
+          "COLORMAP": "viridis",
+          "ENABLE": true,
+          "LAYER_LIST": [
+            "s5/pathway0_res14"
+          ],
+          "USE_TRUE_LABEL": false
+        },
+        "INPUT_VIDEO": true,
+        "LAYER_LIST": [
+          "s5/pathway0_res14"
+        ],
+        "MODEL_WEIGHTS": true,
+        "TOPK_PREDS": 1
+      },
+      "PREDICTIONS_PATH": "",
+      "WRONG_PRED_VIS": {
+        "ENABLE": false,
+        "SUBSET_PATH": "",
+        "TAG": "Incorrectly classified videos."
+      }
+    },
+    "TEST": {
+      "BATCH_SIZE": 64,
+      "CHECKPOINT_FILE_PATH": "",
+      "CHECKPOINT_TYPE": "pytorch",
+      "DATASET": "charades",
+      "ENABLE": false,
+      "NUM_ENSEMBLE_VIEWS": 2,
+      "NUM_SPATIAL_CROPS": 1,
+      "NUM_TEMPORAL_CLIPS": [],
+      "SAVE_RESULTS_PATH": "kabr/KABR/logs/x3d-l-kabr/results.txt"
+    },
+    "TRAIN": {
+      "AUTO_RESUME": true,
+      "BATCH_SIZE": 64,
+      "CHECKPOINT_CLEAR_NAME_PATTERN": [],
+      "CHECKPOINT_EPOCH_RESET": true,
+      "CHECKPOINT_FILE_PATH": "slowfast/projects/x3d/x3d_l.pyth",
+      "CHECKPOINT_INFLATE": false,
+      "CHECKPOINT_IN_INIT": false,
+      "CHECKPOINT_PERIOD": 5,
+      "CHECKPOINT_TYPE": "pytorch",
+      "DATASET": "charades",
+      "ENABLE": true,
+      "EVAL_PERIOD": 5,
+      "KILL_LOSS_EXPLOSION_FACTOR": 0.0,
+      "MIXED_PRECISION": false
+    },
+    "VIS_MASK": {
+      "ENABLE": false
+    },
+    "X3D": {
+      "BN_LIN5": false,
+      "BOTTLENECK_FACTOR": 2.25,
+      "CHANNELWISE_3x3x3": true,
+      "DEPTH_FACTOR": 5.0,
+      "DIM_C1": 12,
+      "DIM_C5": 2048,
+      "SCALE_RES2": false,
+      "WIDTH_FACTOR": 2.0
+    }
+  },
+  "model_type": "x3d",
+  "torch_dtype": "float32",
+  "transformers_version": "4.46.0"
+}

model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c3b84df54f08ad0b9a7858524fdb144229dddcd59b2a82c008b7832a9c6755a9
+size 21795296