| 1234567891011121314151617181920212223242526272829303132333435363738 |
- {
- "estimate": {
- "items": [
- {
- "offloadLayers": 0,
- "fullOffloaded": false,
- "ram": {
- "handleLayers": 32,
- "handleLastLayer": 31,
- "handleOutputLayer": true,
- "remote": false,
- "uma": 1245834200,
- "nonuma": 1403120600
- },
- "vrams": [
- {
- "handleLayers": 0,
- "handleLastLayer": -1,
- "handleOutputLayer": false,
- "remote": false,
- "uma": 0,
- "nonuma": 964157440
- }
- ]
- }
- ],
- "type": "model",
- "architecture": "llama",
- "contextSize": 8192,
- "flashAttention": false,
- "noMMap": false,
- "embeddingOnly": false,
- "reranking": false,
- "distributable": true,
- "logicalBatchSize": 2048,
- "physicalBatchSize": 512
- }
- }
|