FERMI
N.B. this page is under construction
Components
TODO
Launching a DODAS instance of HTCondor for CMS
To lauch an instance of Fermi HTCondor cluster on K8s you should apply simple changes to the HTCondor HELM values indicated either for DODAS (this guide) or plain HELM (this other guide).
The value file template looks as follows:
condorHost: {{ condor_host }}
ccbHost: {{ ccb_address }}
proxyCacheHost: {{ k8s_master_ip }}
ttsCache:
    image: dodasts/tts-cache
    tag: v0.1.3-k8s-12
    iamToken: {{ iam_token }}
    iamClientId: 99f7152a-...-8f27dcbe67e0 
    iamClientSecret: AIEx7S3vA-...-b2lQ8i4Qdv_38o 
htcSchedd:
    image: {{ htcondor_docker_image }}
    tag: v0.1.0-k8s-schedd-3
    networkInterface: {{ schedd_netinterface }}
    persistence:
    storageClass: local-path
    size: 200Gi
    claimSize: 199Gi
    # local-storage for k8s, local-path for k3s
    storageClass: local-storage
    # persistence of the schedd spool directory
    mountPath: /var/lib/condor/spool/
    # mount options
    options: |
        local:
        path: \"/mnt/spool/\"
        nodeAffinity:
        required:
            nodeSelectorTerms:
            - matchExpressions:
                - key: condor
                operator: In
                values:
                    - schedd
htcMaster:
    image: {{ htcondor_docker_image }}
    tag: v0.1.0-k8s-schedd-3
    networkInterface: {{ condor_host }}
htcWn:
    image: {{ htcondor_docker_image }}
    tag: v0.1.0-k8s-fermi-2
    persistentVolume:
    pv:
        name: "data-rclone-1"
        spec: |
        accessModes:
        - ReadWriteMany
        capacity:
            storage: 800Gi
        storageClassName: rclone
        csi:
            driver: csi-rclone
            volumeHandle: data-id
            volumeAttributes:
            remote: "s3"
            remotePath: "home"
            s3-provider: "Minio"
            s3-endpoint: "https://<CHANGEME>:9000"
            s3-access-key-id: "CHANGEME"
            s3-secret-access-key: "CHANGEME"
            no-check-certificate: "true"
            vfs-cache-mode: "writes"
            vfs-cache-max-size: "4G"
            buffer-size: 2G
            vfs-read-chunk-size: "512k"
            vfs-read-chunk-size-limit: "10M"
            no-modtime: "true"
    pvc:
        name: "data-rclone-1"
        mountPath: "/home/Volume_Fermi"
        spec: |
        accessModes:
        - ReadWriteMany
        resources:
            requests:
            storage: "799Gi"
        storageClassName: rclone
        volumeName: data-rclone-1
        selector:
            matchLabels:
            name: data-rclone-1
    # Resource limits and requests
    cpu:
    request: 0.8
    limit: 1.5
    ram:
    request: 1024Mi
    limit: 2048Mi
    # Condor slot type
    slotType: cpus=1, mem=200
cvmfs:
    enabled: true 
    image: cloudpg/cvmfs
    tag: k8s-dev
    pullPolicy: IfNotPresent
    replicas: 1
    # List of repos to be mounted
    repoList: fermi.local.repo 
    privKey: 
    - name: fermi
        filename: fermi.local.repo.pub
        path: \"keys\"
        content: | 
        -----BEGIN PUBLIC KEY-----
        MIIBIjANBgkqhkiG9w0BAQEFAAOCAQ8AMIIBCgKCAQEA5Rezgpvuhl0lyEMFTuKm
        +J2D5KwjzgNLMEMG6dumKb7Zjohy8dxvhHqqH9USQrF570ug+i5pLHcZB66Z0bBC
        -----END PUBLIC KEY-----
    defaultLocalConfig:
    - file: fermi.local.repo.conf
        content: |
        CVMFS_SERVER_URL=http://<CHANGEME>/cvmfs/fermi.local.repo
        CVMFS_PUBLIC_KEY=/etc/cvmfs/keys/fermi.local.repo.pub
        CVMFS_HTTP_PROXY=DIRECT
TODO: put link