Spaces:

SEUyishu
/

MatDeepLearn

Sleeping

App Files Files Community

SEUyishu commited on Dec 3, 2025

Commit

bec0b04

verified ·

1 Parent(s): 778fec6

Upload 3 files

Browse files

Files changed (3) hide show

Dockerfile +40 -0
app.py +91 -0
config.yml +248 -0

Dockerfile ADDED Viewed

	@@ -0,0 +1,40 @@

+FROM python:3.10-slim
+# Create non-root user for HuggingFace Space
+RUN useradd -m -u 1000 user && \
+    apt-get update && \
+    apt-get install -y --no-install-recommends \
+        build-essential \
+        git \
+    && rm -rf /var/lib/apt/lists/* && \
+    python -m pip install --upgrade pip
+USER user
+ENV PATH="/home/user/.local/bin:$PATH"
+ENV HOME="/home/user"
+WORKDIR /app
+# Copy requirements first for better caching
+COPY --chown=user ./mcp_output/requirements.txt /app/requirements.txt
+RUN pip install --no-cache-dir --upgrade -r requirements.txt
+# Copy the entire MatDeepLearn project
+COPY --chown=user . /app
+# Set Python path to include MatDeepLearn.
+# No earlier instruction in this file defines PYTHONPATH, so it is set outright
+# instead of appended to (appending would expand an undefined variable and
+# leave a dangling ":" separator in the value).
+ENV PYTHONPATH=/app
+# Expose HuggingFace default port
+EXPOSE 7860
+# Set environment variables for MCP service
+ENV MCP_TRANSPORT=http
+ENV MCP_PORT=7860
+# Health check
+HEALTHCHECK --interval=30s --timeout=10s --start-period=5s --retries=3 \
+    CMD python -c "import urllib.request; urllib.request.urlopen('http://localhost:7860/health')" || exit 1
+# Start MCP service
+CMD ["python", "mcp_output/start_mcp.py"]

app.py ADDED Viewed

	@@ -0,0 +1,91 @@

+"""
+MatDeepLearn MCP Service - HuggingFace Space Entry Point
+This file provides a FastAPI application for health checks and service info.
+The actual MCP service is started via start_mcp.py.
+"""
+from fastapi import FastAPI
+from fastapi.responses import JSONResponse
+import os
+import sys
+# Ensure the directory containing this file (treated as the project root) is on sys.path
+project_root = os.path.dirname(os.path.abspath(__file__))
+if project_root not in sys.path:  # skip when already present to avoid a duplicate entry
+    sys.path.insert(0, project_root)  # index 0 so it is searched before other entries
+app = FastAPI(
+    title="MatDeepLearn MCP Service",
+    description="Graph Neural Networks for Materials Property Prediction",
+    version="1.0.0"
+)
+@app.get("/")
+async def root():
+    """Root endpoint with service information."""
+    return {
+        "status": "ok",
+        "service": "MatDeepLearn MCP Service",
+        "description": "Graph Neural Networks for Materials Property Prediction",
+        "transport": os.environ.get("MCP_TRANSPORT", "stdio"),
+        "available_models": [
+            "CGCNN_demo", "MPNN_demo", "SchNet_demo",
+            "MEGNet_demo", "GCN_demo", "SOAP_demo", "SM_demo"
+        ]
+    }
+@app.get("/health")
+async def health():
+    """Health check endpoint."""
+    try:
+        import torch
+        gpu_available = torch.cuda.is_available()
+    except:
+        gpu_available = False
+    return {
+        "status": "healthy",
+        "gpu_available": gpu_available
+    }
+@app.get("/info")
+async def info():
+    """Detailed service information."""
+    try:
+        import torch
+        torch_version = torch.__version__
+        gpu_available = torch.cuda.is_available()
+        gpu_count = torch.cuda.device_count() if gpu_available else 0
+    except:
+        torch_version = "N/A"
+        gpu_available = False
+        gpu_count = 0
+    return {
+        "service": "MatDeepLearn MCP Service",
+        "version": "1.0.0",
+        "torch_version": torch_version,
+        "gpu_available": gpu_available,
+        "gpu_count": gpu_count,
+        "mcp_tools": [
+            "check_environment",
+            "list_available_models",
+            "get_model_config",
+            "process_structure_data",
+            "train_model",
+            "predict_properties",
+            "cross_validation",
+            "analyze_structure",
+            "compare_models",
+            "get_dataset_info"
+        ]
+    }
+if __name__ == "__main__":
+    import uvicorn
+    port = int(os.environ.get("PORT", "7860"))
+    uvicorn.run(app, host="0.0.0.0", port=port)

config.yml ADDED Viewed

	@@ -0,0 +1,248 @@

+Job:
+    run_mode: "Training"
+    #{Training, Predict, Repeat, CV, Hyperparameter, Ensemble, Analysis}
+    Training:
+        job_name: "my_train_job"
+        reprocess: "False"
+        model: CGCNN_demo
+        load_model: "False"
+        save_model: "True"
+        model_path: "my_model.pth"
+        write_output: "True"
+        parallel: "True"
+        #seed=0 means random initialization
+        seed: 0
+    Predict:
+        job_name: "my_predict_job"
+        reprocess: "False"
+        model_path: "my_model.pth"
+        write_output: "True"
+        seed: 0
+    Repeat:
+        job_name: "my_repeat_job"
+        reprocess: "False"
+        model: CGCNN_demo
+        model_path: "my_model.pth"
+        write_output: "False"
+        parallel: "True"
+        seed: 0
+        ###specific options
+        #number of repeat trials
+        repeat_trials: 5
+    CV:
+        job_name: "my_CV_job"
+        reprocess: "False"
+        model: CGCNN_demo
+        write_output: "True"
+        parallel: "True"
+        seed: 0
+        ###specific options
+        #number of folds for n-fold CV
+        cv_folds: 5
+    Hyperparameter:
+        job_name: "my_hyperparameter_job"
+        reprocess: "False"
+        model: CGCNN_demo
+        seed: 0
+        ###specific options
+        hyper_trials: 10
+        #number of concurrent trials (can be greater than number of GPUs)
+        hyper_concurrency: 8
+        #frequency of checkpointing and update (default: 1)
+        hyper_iter: 1
+        #resume a previous hyperparameter optimization run
+        hyper_resume: "True"
+        #Verbosity of ray tune output; available: (1, 2, 3)
+        hyper_verbosity: 1
+        #Delete processed datasets
+        hyper_delete_processed: "True"
+    Ensemble:
+        job_name: "my_ensemble_job"
+        reprocess: "False"
+        save_model: "False"
+        model_path: "my_model.pth"
+        write_output: "Partial"
+        parallel: "True"
+        seed: 0
+        ###specific options
+        #List of models to use: (Example: "CGCNN_demo,MPNN_demo,SchNet_demo,MEGNet_demo" or "CGCNN_demo,CGCNN_demo,CGCNN_demo,CGCNN_demo")
+        ensemble_list: "CGCNN_demo,CGCNN_demo,CGCNN_demo,CGCNN_demo,CGCNN_demo"
+    Analysis:
+        job_name: "my_job"
+        reprocess: "False"
+        model: CGCNN_demo
+        model_path: "my_model.pth"
+        write_output: "True"
+        seed: 0
+Processing:
+    #Whether to use "inmemory" or "large" format for pytorch-geometric dataset. Recommend inmemory unless the dataset is too large
+    dataset_type: "inmemory"
+    #Path to data files
+    data_path: "/data"
+    #Path to target file within data_path
+    target_path: "targets.csv"
+    #Method of obtaining atom dictionary: available:(provided, default, blank, generated)
+    dictionary_source: "default"
+    #Path to atom dictionary file within data_path
+    dictionary_path: "atom_dict.json"
+    #Format of data files (limit to those supported by ASE)
+    data_format: "json"
+    #Print out processing info
+    verbose: "True"
+    #graph specific settings
+    graph_max_radius : 8.0
+    graph_max_neighbors : 12
+    voronoi: "False"
+    edge_features: "True"
+    graph_edge_length : 50
+    #SM specific settings
+    SM_descriptor: "False"
+    #SOAP specific settings
+    SOAP_descriptor: "False"
+    SOAP_rcut : 8.0
+    SOAP_nmax : 6
+    SOAP_lmax : 4
+    SOAP_sigma : 0.3
+Training:
+    #Index of target column in targets.csv
+    target_index: 0
+    #Loss functions (from pytorch) examples: l1_loss, mse_loss, binary_cross_entropy
+    loss: "l1_loss"
+    #Ratios for train/val/test split out of a total of 1
+    train_ratio: 0.8
+    val_ratio: 0.05
+    test_ratio: 0.15
+    #Training print out frequency (print per n number of epochs)
+    verbosity: 5
+Models:
+    CGCNN_demo:
+        model: CGCNN
+        dim1: 100
+        dim2: 150
+        pre_fc_count: 1
+        gc_count: 4
+        post_fc_count: 3
+        pool: "global_mean_pool"
+        pool_order: "early"
+        batch_norm: "True"
+        batch_track_stats: "True"
+        act: "relu"
+        dropout_rate: 0.0
+        epochs: 250
+        lr: 0.002
+        batch_size: 100
+        optimizer: "AdamW"
+        optimizer_args: {}
+        scheduler: "ReduceLROnPlateau"
+        scheduler_args: {"mode":"min", "factor":0.8, "patience":10, "min_lr":0.00001, "threshold":0.0002}
+    MPNN_demo:
+        model: MPNN
+        dim1: 100
+        dim2: 100
+        dim3: 100
+        pre_fc_count: 1
+        gc_count: 4
+        post_fc_count: 3
+        pool: "global_mean_pool"
+        pool_order: "early"
+        batch_norm: "True"
+        batch_track_stats: "True"
+        act: "relu"
+        dropout_rate: 0.0
+        epochs: 250
+        lr: 0.001
+        batch_size: 100
+        optimizer: "AdamW"
+        optimizer_args: {}
+        scheduler: "ReduceLROnPlateau"
+        scheduler_args: {"mode":"min", "factor":0.8, "patience":10, "min_lr":0.00001, "threshold":0.0002}
+    SchNet_demo:
+        model: SchNet
+        dim1: 100
+        dim2: 100
+        dim3: 150
+        cutoff: 8
+        pre_fc_count: 1
+        gc_count: 4
+        post_fc_count: 3
+        pool: "global_mean_pool"
+        pool_order: "early"
+        batch_norm: "True"
+        batch_track_stats: "True"
+        act: "relu"
+        dropout_rate: 0.0
+        epochs: 250
+        lr: 0.0005
+        batch_size: 100
+        optimizer: "AdamW"
+        optimizer_args: {}
+        scheduler: "ReduceLROnPlateau"
+        scheduler_args: {"mode":"min", "factor":0.8, "patience":10, "min_lr":0.00001, "threshold":0.0002}
+    MEGNet_demo:
+        model: MEGNet
+        dim1: 100
+        dim2: 100
+        dim3: 100
+        pre_fc_count: 1
+        gc_count: 4
+        gc_fc_count: 1
+        post_fc_count: 3
+        pool: "global_mean_pool"
+        pool_order: "early"
+        batch_norm: "True"
+        batch_track_stats: "True"
+        act: "relu"
+        dropout_rate: 0.0
+        epochs: 250
+        lr: 0.0005
+        batch_size: 100
+        optimizer: "AdamW"
+        optimizer_args: {}
+        scheduler: "ReduceLROnPlateau"
+        scheduler_args: {"mode":"min", "factor":0.8, "patience":10, "min_lr":0.00001, "threshold":0.0002}
+    GCN_demo:
+        model: GCN
+        dim1: 100
+        dim2: 150
+        pre_fc_count: 1
+        gc_count: 4
+        post_fc_count: 3
+        pool: "global_mean_pool"
+        pool_order: "early"
+        batch_norm: "True"
+        batch_track_stats: "True"
+        act: "relu"
+        dropout_rate: 0.0
+        epochs: 250
+        lr: 0.002
+        batch_size: 100
+        optimizer: "AdamW"
+        optimizer_args: {}
+        scheduler: "ReduceLROnPlateau"
+        scheduler_args: {"mode":"min", "factor":0.8, "patience":10, "min_lr":0.00001, "threshold":0.0002}
+    SM_demo:
+        model: SM
+        dim1: 100
+        fc_count: 2
+        epochs: 200
+        lr: 0.002
+        batch_size: 100
+        optimizer: "AdamW"
+        optimizer_args: {}
+        scheduler: "ReduceLROnPlateau"
+        scheduler_args: {"mode":"min", "factor":0.8, "patience":10, "min_lr":0.00001, "threshold":0.0002}
+    SOAP_demo:
+        model: SOAP
+        dim1: 100
+        fc_count: 2
+        epochs: 200
+        lr: 0.002
+        batch_size: 100
+        optimizer: "AdamW"
+        optimizer_args: {}
+        scheduler: "ReduceLROnPlateau"
+        scheduler_args: {"mode":"min", "factor":0.8, "patience":10, "min_lr":0.00001, "threshold":0.0002}