| 12345678910111213141516171819202122232425262728293031323334353637383940414243444546 |
- {
- "estimate": {
- "items": [
- {
- "offloadLayers": 81,
- "fullOffloaded": true,
- "ram": {
- "handleLayers": 0,
- "handleLastLayer": -1,
- "handleOutputLayer": false,
- "remote": false,
- "uma": 297878712,
- "nonuma": 455165112
- },
- "vrams": [
- {
- "handleLayers": 41,
- "handleLastLayer": 40,
- "handleOutputLayer": false,
- "remote": false,
- "uma": 1342723072,
- "nonuma": 22912443392
- },
- {
- "handleLayers": 39,
- "handleLastLayer": 79,
- "handleOutputLayer": true,
- "remote": false,
- "uma": 22649753600,
- "nonuma": 22911897600
- }
- ]
- }
- ],
- "type": "model",
- "architecture": "llama",
- "contextSize": 8192,
- "flashAttention": false,
- "noMMap": false,
- "embeddingOnly": false,
- "reranking": false,
- "distributable": true,
- "logicalBatchSize": 2048,
- "physicalBatchSize": 512
- }
- }
|