(oobabooga) [username@archripper llama.cpp] :) $ ./main -m ../text-generation-webui/models/mixtral-8x7b-instruct-v0.1.Q5_K_M.gguf -e -p "[INST] How fast can a Toyota Supra go? [/INST]" --min-p 0.05 --top-p 1.0 -n 10 -ngl 10 Log start main: build = 1632 (70f806b) main: built with cc (GCC) 13.2.1 20230801 for x86_64-pc-linux-gnu main: seed = 1702491481 acquiring VM for da74 using 9 Initialized unreserved SVM apertures: 0x200000 - 0x7fffffffffff mem_handle_aperture start 0x2800000000000, mem_handle_aperture limit 0x3000000000000 [hsaKmtAllocMemory] node 0 [hsaKmtMapMemoryToGPU] address 0x7fe780200000 [hsaKmtAllocMemory] node 0 bind_mem_to_numa mem 0x7fe78020a000 flags 0x20040 size 0x1000 node_id 0 [hsaKmtMapMemoryToGPUNodes] address 0x7fe78020a000 number of nodes 1 [hsaKmtAllocMemory] node 1 [hsaKmtAllocMemory] node 0 bind_mem_to_numa mem 0x7fe7801fe000 flags 0x21040 size 0x1000 node_id 0 [hsaKmtMapMemoryToGPUNodes] address 0x7fe7801fe000 number of nodes 1 [hsaKmtGetTileConfig] node 1 [hsaKmtAllocMemory] node 0 bind_mem_to_numa mem 0x7fe7801fc000 flags 0x40 size 0x1000 node_id 0 [hsaKmtQueryPointerInfo] pointer 0x7fe7801fc000 [hsaKmtMapMemoryToGPUNodes] address 0x7fe7801fc000 number of nodes 1 [hsaKmtAllocMemory] node 0 bind_mem_to_numa mem 0x7fe564600000 flags 0x2040 size 0x101000 node_id 0 [hsaKmtQueryPointerInfo] pointer 0x7fe564600000 [hsaKmtMapMemoryToGPUNodes] address 0x7fe564600000 number of nodes 1 [hsaKmtAllocMemory] node 0 bind_mem_to_numa mem 0x7fe564400000 flags 0x2040 size 0x101000 node_id 0 [hsaKmtQueryPointerInfo] pointer 0x7fe564400000 [hsaKmtMapMemoryToGPUNodes] address 0x7fe564400000 number of nodes 1 [hsaKmtAllocMemory] node 1 [hsaKmtMapMemoryToGPUNodes] address 0x7fe748560000 number of nodes 1 [hsaKmtAllocMemory] node 0 bind_mem_to_numa mem 0x7fe6e99c0000 flags 0x40 size 0x25000 node_id 0 [hsaKmtMapMemoryToGPUNodes] address 0x7fe6e99c0000 number of nodes 1 [hsaKmtAllocMemory] node 0 [hsaKmtMapMemoryToGPUNodes] address 0x7fe7801fa000 number of nodes 1 [hsaKmtAllocMemory] node 0 bind_mem_to_numa mem 0x7fe7801f8000 flags 0x21040 size 0x1000 node_id 0 [hsaKmtMapMemoryToGPUNodes] address 0x7fe7801f8000 number of nodes 1 [hsaKmtAllocMemory] node 0 [hsaKmtRegisterMemoryToNodes] address 0x7fe7801f6000 number of nodes 1 [hsaKmtMapMemoryToGPU] address 0x7fe7801f6000 [hsaKmtAllocMemory] node 1 [hsaKmtRegisterMemoryToNodes] address 0x7fe7801f4000 number of nodes 1 [hsaKmtMapMemoryToGPU] address 0x7fe7801f4000 [hsaKmtAllocMemory] node 0 bind_mem_to_numa mem 0x7fe55c200000 flags 0x1040 size 0x2c02000 node_id 0 [hsaKmtRegisterMemoryToNodes] address 0x7fe55c200000 number of nodes 1 [hsaKmtMapMemoryToGPU] address 0x7fe55c200000 [hsaKmtUnmapMemoryToGPU] address 0x7fe7801f4000 [hsaKmtFreeMemory] address 0x7fe7801f4000 [hsaKmtUnmapMemoryToGPU] address 0x7fe55c200000 [hsaKmtFreeMemory] address 0x7fe55c200000 [hsaKmtUnmapMemoryToGPU] address 0x7fe7801f6000 [hsaKmtFreeMemory] address 0x7fe7801f6000 [hsaKmtUnmapMemoryToGPU] address 0x7fe7801f8000 [hsaKmtFreeMemory] address 0x7fe7801f8000 [hsaKmtUnmapMemoryToGPU] address 0x7fe7801fa000 [hsaKmtFreeMemory] address 0x7fe7801fa000 [hsaKmtUnmapMemoryToGPU] address 0x7fe748560000 [hsaKmtFreeMemory] address 0x7fe748560000 [hsaKmtUnmapMemoryToGPU] address 0x7fe6e99c0000 [hsaKmtFreeMemory] address 0x7fe6e99c0000 [hsaKmtAllocMemory] node 1 [hsaKmtMapMemoryToGPUNodes] address 0x7fe748a80000 number of nodes 1 [hsaKmtAllocMemory] node 0 bind_mem_to_numa mem 0x7fe748570000 flags 0x40 size 0x19000 node_id 0 [hsaKmtMapMemoryToGPUNodes] address 0x7fe748570000 number of nodes 1 [hsaKmtAllocMemory] node 0 [hsaKmtMapMemoryToGPUNodes] address 0x7fe7801fa000 number of nodes 1 [hsaKmtAllocMemory] node 0 bind_mem_to_numa mem 0x7fe7801f8000 flags 0x21040 size 0x1000 node_id 0 [hsaKmtMapMemoryToGPUNodes] address 0x7fe7801f8000 number of nodes 1 [hsaKmtAllocMemory] node 0 [hsaKmtRegisterMemoryToNodes] address 0x7fe7801f6000 number of nodes 1 [hsaKmtMapMemoryToGPU] address 0x7fe7801f6000 [hsaKmtAllocMemory] node 1 [hsaKmtRegisterMemoryToNodes] address 0x7fe7801f4000 number of nodes 1 [hsaKmtMapMemoryToGPU] address 0x7fe7801f4000 [hsaKmtAllocMemory] node 0 bind_mem_to_numa mem 0x7fe55c200000 flags 0x1040 size 0x2c02000 node_id 0 [hsaKmtRegisterMemoryToNodes] address 0x7fe55c200000 number of nodes 1 [hsaKmtMapMemoryToGPU] address 0x7fe55c200000 [hsaKmtUnmapMemoryToGPU] address 0x7fe7801f4000 [hsaKmtFreeMemory] address 0x7fe7801f4000 [hsaKmtUnmapMemoryToGPU] address 0x7fe55c200000 [hsaKmtFreeMemory] address 0x7fe55c200000 [hsaKmtUnmapMemoryToGPU] address 0x7fe7801f6000 [hsaKmtFreeMemory] address 0x7fe7801f6000 [hsaKmtUnmapMemoryToGPU] address 0x7fe7801f8000 [hsaKmtFreeMemory] address 0x7fe7801f8000 [hsaKmtUnmapMemoryToGPU] address 0x7fe7801fa000 [hsaKmtFreeMemory] address 0x7fe7801fa000 [hsaKmtUnmapMemoryToGPU] address 0x7fe748a80000 [hsaKmtFreeMemory] address 0x7fe748a80000 [hsaKmtUnmapMemoryToGPU] address 0x7fe748570000 [hsaKmtFreeMemory] address 0x7fe748570000 [hsaKmtAllocMemory] node 1 [hsaKmtMapMemoryToGPUNodes] address 0x7fe748570000 number of nodes 1 [hsaKmtAllocMemory] node 0 bind_mem_to_numa mem 0x7fe748550000 flags 0x40 size 0x1d000 node_id 0 [hsaKmtMapMemoryToGPUNodes] address 0x7fe748550000 number of nodes 1 [hsaKmtAllocMemory] node 0 [hsaKmtMapMemoryToGPUNodes] address 0x7fe7801fa000 number of nodes 1 [hsaKmtAllocMemory] node 0 bind_mem_to_numa mem 0x7fe7801f8000 flags 0x21040 size 0x1000 node_id 0 [hsaKmtMapMemoryToGPUNodes] address 0x7fe7801f8000 number of nodes 1 [hsaKmtAllocMemory] node 0 [hsaKmtRegisterMemoryToNodes] address 0x7fe7801f6000 number of nodes 1 [hsaKmtMapMemoryToGPU] address 0x7fe7801f6000 [hsaKmtAllocMemory] node 1 [hsaKmtRegisterMemoryToNodes] address 0x7fe7801f4000 number of nodes 1 [hsaKmtMapMemoryToGPU] address 0x7fe7801f4000 [hsaKmtAllocMemory] node 0 bind_mem_to_numa mem 0x7fe55c200000 flags 0x1040 size 0x2c02000 node_id 0 [hsaKmtRegisterMemoryToNodes] address 0x7fe55c200000 number of nodes 1 [hsaKmtMapMemoryToGPU] address 0x7fe55c200000 [hsaKmtUnmapMemoryToGPU] address 0x7fe7801f4000 [hsaKmtFreeMemory] address 0x7fe7801f4000 [hsaKmtUnmapMemoryToGPU] address 0x7fe55c200000 [hsaKmtFreeMemory] address 0x7fe55c200000 [hsaKmtUnmapMemoryToGPU] address 0x7fe7801f6000 [hsaKmtFreeMemory] address 0x7fe7801f6000 [hsaKmtUnmapMemoryToGPU] address 0x7fe7801f8000 [hsaKmtFreeMemory] address 0x7fe7801f8000 [hsaKmtUnmapMemoryToGPU] address 0x7fe7801fa000 [hsaKmtFreeMemory] address 0x7fe7801fa000 [hsaKmtUnmapMemoryToGPU] address 0x7fe748570000 [hsaKmtFreeMemory] address 0x7fe748570000 [hsaKmtUnmapMemoryToGPU] address 0x7fe748550000 [hsaKmtFreeMemory] address 0x7fe748550000 [hsaKmtAllocMemory] node 1 [hsaKmtMapMemoryToGPUNodes] address 0x7fe748540000 number of nodes 1 [hsaKmtAllocMemory] node 0 bind_mem_to_numa mem 0x7fe6e99c0000 flags 0x40 size 0x3e000 node_id 0 [hsaKmtMapMemoryToGPUNodes] address 0x7fe6e99c0000 number of nodes 1 [hsaKmtAllocMemory] node 0 [hsaKmtMapMemoryToGPUNodes] address 0x7fe7801fa000 number of nodes 1 [hsaKmtAllocMemory] node 0 bind_mem_to_numa mem 0x7fe7801f8000 flags 0x21040 size 0x1000 node_id 0 [hsaKmtMapMemoryToGPUNodes] address 0x7fe7801f8000 number of nodes 1 [hsaKmtAllocMemory] node 0 [hsaKmtRegisterMemoryToNodes] address 0x7fe7801f6000 number of nodes 1 [hsaKmtMapMemoryToGPU] address 0x7fe7801f6000 [hsaKmtAllocMemory] node 1 [hsaKmtRegisterMemoryToNodes] address 0x7fe7801f4000 number of nodes 1 [hsaKmtMapMemoryToGPU] address 0x7fe7801f4000 [hsaKmtAllocMemory] node 0 bind_mem_to_numa mem 0x7fe55c200000 flags 0x1040 size 0x2c02000 node_id 0 [hsaKmtRegisterMemoryToNodes] address 0x7fe55c200000 number of nodes 1 [hsaKmtMapMemoryToGPU] address 0x7fe55c200000 [hsaKmtUnmapMemoryToGPU] address 0x7fe7801f4000 [hsaKmtFreeMemory] address 0x7fe7801f4000 [hsaKmtUnmapMemoryToGPU] address 0x7fe55c200000 [hsaKmtFreeMemory] address 0x7fe55c200000 [hsaKmtUnmapMemoryToGPU] address 0x7fe7801f6000 [hsaKmtFreeMemory] address 0x7fe7801f6000 [hsaKmtUnmapMemoryToGPU] address 0x7fe7801f8000 [hsaKmtFreeMemory] address 0x7fe7801f8000 [hsaKmtUnmapMemoryToGPU] address 0x7fe7801fa000 [hsaKmtFreeMemory] address 0x7fe7801fa000 [hsaKmtUnmapMemoryToGPU] address 0x7fe748540000 [hsaKmtFreeMemory] address 0x7fe748540000 [hsaKmtUnmapMemoryToGPU] address 0x7fe6e99c0000 [hsaKmtFreeMemory] address 0x7fe6e99c0000 [hsaKmtAllocMemory] node 1 [hsaKmtMapMemoryToGPUNodes] address 0x7fe7801e8000 number of nodes 1 [hsaKmtAllocMemory] node 0 bind_mem_to_numa mem 0x7fe748a98000 flags 0x40 size 0xf000 node_id 0 [hsaKmtMapMemoryToGPUNodes] address 0x7fe748a98000 number of nodes 1 [hsaKmtAllocMemory] node 0 [hsaKmtMapMemoryToGPUNodes] address 0x7fe7801fa000 number of nodes 1 [hsaKmtAllocMemory] node 0 bind_mem_to_numa mem 0x7fe7801f8000 flags 0x21040 size 0x1000 node_id 0 [hsaKmtMapMemoryToGPUNodes] address 0x7fe7801f8000 number of nodes 1 [hsaKmtAllocMemory] node 0 [hsaKmtRegisterMemoryToNodes] address 0x7fe7801e6000 number of nodes 1 [hsaKmtMapMemoryToGPU] address 0x7fe7801e6000 [hsaKmtAllocMemory] node 1 [hsaKmtRegisterMemoryToNodes] address 0x7fe7801e4000 number of nodes 1 [hsaKmtMapMemoryToGPU] address 0x7fe7801e4000 [hsaKmtAllocMemory] node 0 bind_mem_to_numa mem 0x7fe55c200000 flags 0x1040 size 0x2c02000 node_id 0 [hsaKmtRegisterMemoryToNodes] address 0x7fe55c200000 number of nodes 1 [hsaKmtMapMemoryToGPU] address 0x7fe55c200000 [hsaKmtAvailableMemory] node 1 [hsaKmtMapMemoryToGPU] address 0x7fe564800000 [hsaKmtAllocMemory] node 0 bind_mem_to_numa mem 0x7fe748a96000 flags 0x21040 size 0x1000 node_id 0 [hsaKmtMapMemoryToGPUNodes] address 0x7fe748a96000 number of nodes 1 [hsaKmtAllocMemory] node 0 bind_mem_to_numa mem 0x7fe748a92000 flags 0x20040 size 0x2000 node_id 0 [hsaKmtMapMemoryToGPUNodes] address 0x7fe748a92000 number of nodes 1 [hsaKmtAllocMemory] node 0 bind_mem_to_numa mem 0x7fe748a90000 flags 0x21040 size 0x1000 node_id 0 [hsaKmtMapMemoryToGPUNodes] address 0x7fe748a90000 number of nodes 1 [hsaKmtAllocMemory] node 0 bind_mem_to_numa mem 0x7fe748a8e000 flags 0x21040 size 0x1000 node_id 0 [hsaKmtMapMemoryToGPUNodes] address 0x7fe748a8e000 number of nodes 1 [hsaKmtAllocMemory] node 0 bind_mem_to_numa mem 0x7fe748a8c000 flags 0x21040 size 0x1000 node_id 0 [hsaKmtMapMemoryToGPUNodes] address 0x7fe748a8c000 number of nodes 1