Spaces:

maomao88
/

model_structure_viewer

Runtime error

App Files Files Community

maomao88 committed on Sep 27

Commit

119afbd

1 Parent(s): 5850346

more updates

Browse files

Files changed (4) hide show

README.md +1 -1
backend/__pycache__/hf_model_utils.cpython-313.pyc +0 -0
backend/hf_model_utils.py +23 -3
frontend/src/components/ModelInputBar.jsx +1 -1

README.md CHANGED Viewed

@@ -57,7 +57,7 @@ This app is developed using React + Fastapi. You can run this app locally with t
 4. **(Optional) Install GPU-related packages**
-   If you are running on a GPU-enabled device, you can install additional packages (e.g., for faster inference and support for more models):
    ```commandline
    python install_gpu_packages.py

 4. **(Optional) Install GPU-related packages**
+   If you are running on a GPU-enabled device, you can install additional packages that add support for more models:
    ```commandline
    python install_gpu_packages.py

backend/__pycache__/hf_model_utils.cpython-313.pyc CHANGED Viewed

Binary files a/backend/__pycache__/hf_model_utils.cpython-313.pyc and b/backend/__pycache__/hf_model_utils.cpython-313.pyc differ

backend/hf_model_utils.py CHANGED Viewed

@@ -3,7 +3,7 @@ import torch.nn as nn
 import json
 import hashlib
 import gc
-from transformers import AutoConfig, AutoModel, AutoModelForCausalLM, AutoModelForMaskedLM
 from accelerate import init_empty_weights
@@ -80,10 +80,30 @@ def get_model_structure(model_name: str, model_type: str | None):
         config = AutoConfig.from_pretrained(model_name, trust_remote_code=True)
         with init_empty_weights():
             model = AutoModelForCausalLM.from_config(config, trust_remote_code=True)
-    if model_type == "masked":
-        config = AutoConfig.from_pretrained("model_name")
         with init_empty_weights():
             model = AutoModelForMaskedLM.from_config(config)
     else:
         config = AutoConfig.from_pretrained(model_name, trust_remote_code=True)
         with torch.device("meta"):

 import json
 import hashlib
 import gc
+from transformers import AutoConfig, AutoModel, AutoModelForCausalLM, AutoModelForMaskedLM, AutoModelForSequenceClassification, AutoModelForTokenClassification, AutoModelForQuestionAnswering, AutoModelForSeq2SeqLM, AutoModelForImageClassification
 from accelerate import init_empty_weights
         config = AutoConfig.from_pretrained(model_name, trust_remote_code=True)
         with init_empty_weights():
             model = AutoModelForCausalLM.from_config(config, trust_remote_code=True)
+    elif model_type == "masked":
+        config = AutoConfig.from_pretrained(model_name, trust_remote_code=True)
         with init_empty_weights():
             model = AutoModelForMaskedLM.from_config(config)
+    elif model_type == "sequence":
+        config = AutoConfig.from_pretrained(model_name, trust_remote_code=True)
+        with init_empty_weights():
+            model = AutoModelForSequenceClassification.from_config(config)
+    elif model_type == "token":
+        config = AutoConfig.from_pretrained(model_name, trust_remote_code=True)
+        with init_empty_weights():
+            model = AutoModelForTokenClassification.from_config(config)
+    elif model_type == "qa":
+        config = AutoConfig.from_pretrained(model_name, trust_remote_code=True)
+        with init_empty_weights():
+            model = AutoModelForQuestionAnswering.from_config(config)
+    elif model_type == "s2s":
+        config = AutoConfig.from_pretrained(model_name, trust_remote_code=True)
+        with init_empty_weights():
+            model = AutoModelForSeq2SeqLM.from_config(config)
+    elif model_type == "vision":
+        config = AutoConfig.from_pretrained(model_name, trust_remote_code=True)
+        with init_empty_weights():
+            model = AutoModelForImageClassification.from_config(config)
     else:
         config = AutoConfig.from_pretrained(model_name, trust_remote_code=True)
         with torch.device("meta"):

frontend/src/components/ModelInputBar.jsx CHANGED Viewed

@@ -5,7 +5,7 @@ export default function ModelInputBar({ loading, fetchModelStructure }) {
     const options = [
         { label: "Not Sure", value: "none", default: "deepseek-ai/DeepSeek-V3.1" },
         { label: "Causal Language Models (e.g. GPT, LLaMA, Phi, Mistral)", value: "causal", default: "gpt2"},
-        { label: "Masked Language Models (BERT, RoBERTa, DistilBERT)", value: "masked", default: "distilbert-base-uncased" },
         { label: "Sequence Classification (text classification, sentiment analysis)", value: "sequence", default: "distilbert-base-uncased" },
         { label: "Token Classification (NER, POS tagging)", value: "token",  default: "dbmdz/bert-large-cased-finetuned-conll03-english" },
         { label: "Question Answering Models (e.g. BERT QA, RoBERTa QA)", value: "qa", default: "distilbert-base-uncased-distilled-squad" },

     const options = [
         { label: "Not Sure", value: "none", default: "deepseek-ai/DeepSeek-V3.1" },
         { label: "Causal Language Models (e.g. GPT, LLaMA, Phi, Mistral)", value: "causal", default: "gpt2"},
+        { label: "Masked Language Models (BERT, RoBERTa, DistilBERT)", value: "masked", default: "google-bert/bert-base-uncased" },
         { label: "Sequence Classification (text classification, sentiment analysis)", value: "sequence", default: "distilbert-base-uncased" },
         { label: "Token Classification (NER, POS tagging)", value: "token",  default: "dbmdz/bert-large-cased-finetuned-conll03-english" },
         { label: "Question Answering Models (e.g. BERT QA, RoBERTa QA)", value: "qa", default: "distilbert-base-uncased-distilled-squad" },