File size: 297 Bytes
5bd179e
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
#ifndef _tuning_h
#define _tuning_h

// ExLlamaTuning: plain aggregate of tuning settings, made up of three
// integer fields followed by six boolean flags. The struct declares no
// default values, so whoever creates an instance must set every field.
//
// NOTE(review): this header does not show how the fields are consumed; the
// per-group notes below are inferred from the field names only and should be
// confirmed against the code that reads them.
struct ExLlamaTuning {
    // Integer settings. The "_thd" suffix presumably means "threshold" —
    // TODO confirm units and comparison direction at the use sites.
    int matmul_recons_thd;
    int fused_mlp_thd;
    int sdp_thd;

    // Boolean switch; presumably selects a fused remap path in matmul — verify.
    bool matmul_fused_remap;

    // Per-operation "no_half2" switches; presumably each one disables a
    // half2-based code path for the named operation — verify against callers.
    bool rmsnorm_no_half2;
    bool rope_no_half2;
    bool matmul_no_half2;
    bool silu_no_half2;

    // Boolean switch; presumably enables use of concurrent streams — verify.
    bool concurrent_streams;
};

#endif