cachepc-linux

Fork of AMDESE/linux with modifications for CachePC side-channel attack
git clone https://git.sinitax.com/sinitax/cachepc-linux
Log | Files | Refs | README | LICENSE | sfeed.txt

goyaP.h (8943B)


      1/* SPDX-License-Identifier: GPL-2.0
      2 *
      3 * Copyright 2016-2022 HabanaLabs, Ltd.
      4 * All Rights Reserved.
      5 *
      6 */
      7
      8#ifndef GOYAP_H_
      9#define GOYAP_H_
     10
     11#include <uapi/misc/habanalabs.h>
     12#include "../common/habanalabs.h"
     13#include "../include/common/hl_boot_if.h"
     14#include "../include/goya/goya_packets.h"
     15#include "../include/goya/goya.h"
     16#include "../include/goya/goya_async_events.h"
     17#include "../include/goya/goya_fw_if.h"
     18
     19#define NUMBER_OF_CMPLT_QUEUES		5
     20#define NUMBER_OF_EXT_HW_QUEUES		5
     21#define NUMBER_OF_CPU_HW_QUEUES		1
     22#define NUMBER_OF_INT_HW_QUEUES		9
     23#define NUMBER_OF_HW_QUEUES		(NUMBER_OF_EXT_HW_QUEUES + \
     24					NUMBER_OF_CPU_HW_QUEUES + \
     25					NUMBER_OF_INT_HW_QUEUES)
     26
     27/*
     28 * Number of MSIX interrupts IDS:
     29 * Each completion queue has 1 ID
     30 * The event queue has 1 ID
     31 */
     32#define NUMBER_OF_INTERRUPTS		(NUMBER_OF_CMPLT_QUEUES + 1)
     33
     34#if (NUMBER_OF_INTERRUPTS > GOYA_MSIX_ENTRIES)
     35#error "Number of MSIX interrupts must be smaller or equal to GOYA_MSIX_ENTRIES"
     36#endif
     37
     38#define QMAN_FENCE_TIMEOUT_USEC		10000		/* 10 ms */
     39
     40#define QMAN_STOP_TIMEOUT_USEC		100000		/* 100 ms */
     41
     42#define CORESIGHT_TIMEOUT_USEC		100000		/* 100 ms */
     43
     44#define GOYA_CPU_TIMEOUT_USEC		15000000	/* 15s */
     45
     46#define TPC_ENABLED_MASK		0xFF
     47
     48#define PLL_HIGH_DEFAULT		1575000000	/* 1.575 GHz */
     49
     50#define MAX_POWER_DEFAULT		200000		/* 200W */
     51
     52#define DC_POWER_DEFAULT		20000		/* 20W */
     53
     54#define DRAM_PHYS_DEFAULT_SIZE		0x100000000ull	/* 4GB */
     55
     56#define GOYA_DEFAULT_CARD_NAME		"HL1000"
     57
     58#define GOYA_MAX_PENDING_CS		64
     59
     60#if !IS_MAX_PENDING_CS_VALID(GOYA_MAX_PENDING_CS)
     61#error "GOYA_MAX_PENDING_CS must be power of 2 and greater than 1"
     62#endif
     63
     64/* DRAM Memory Map */
     65
     66#define CPU_FW_IMAGE_SIZE		0x10000000	/* 256MB */
     67#define MMU_PAGE_TABLES_SIZE		0x0FC00000	/* 252MB */
     68#define MMU_DRAM_DEFAULT_PAGE_SIZE	0x00200000	/* 2MB */
     69#define MMU_CACHE_MNG_SIZE		0x00001000	/* 4KB */
     70
     71#define CPU_FW_IMAGE_ADDR		DRAM_PHYS_BASE
     72#define MMU_PAGE_TABLES_ADDR		(CPU_FW_IMAGE_ADDR + CPU_FW_IMAGE_SIZE)
     73#define MMU_DRAM_DEFAULT_PAGE_ADDR	(MMU_PAGE_TABLES_ADDR + \
     74						MMU_PAGE_TABLES_SIZE)
     75#define MMU_CACHE_MNG_ADDR		(MMU_DRAM_DEFAULT_PAGE_ADDR + \
     76					MMU_DRAM_DEFAULT_PAGE_SIZE)
     77#define DRAM_DRIVER_END_ADDR		(MMU_CACHE_MNG_ADDR + \
     78						MMU_CACHE_MNG_SIZE)
     79
     80#define DRAM_BASE_ADDR_USER		0x20000000
     81
     82#if (DRAM_DRIVER_END_ADDR > DRAM_BASE_ADDR_USER)
     83#error "Driver must reserve no more than 512MB"
     84#endif
     85
     86/*
     87 * SRAM Memory Map for Driver
     88 *
     89 * Driver occupies DRIVER_SRAM_SIZE bytes from the start of SRAM. It is used for
     90 * MME/TPC QMANs
     91 *
     92 */
     93
     94#define MME_QMAN_BASE_OFFSET	0x000000	/* Must be 0 */
     95#define MME_QMAN_LENGTH		64
     96#define TPC_QMAN_LENGTH		64
     97
     98#define TPC0_QMAN_BASE_OFFSET	(MME_QMAN_BASE_OFFSET + \
     99				(MME_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE))
    100#define TPC1_QMAN_BASE_OFFSET	(TPC0_QMAN_BASE_OFFSET + \
    101				(TPC_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE))
    102#define TPC2_QMAN_BASE_OFFSET	(TPC1_QMAN_BASE_OFFSET + \
    103				(TPC_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE))
    104#define TPC3_QMAN_BASE_OFFSET	(TPC2_QMAN_BASE_OFFSET + \
    105				(TPC_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE))
    106#define TPC4_QMAN_BASE_OFFSET	(TPC3_QMAN_BASE_OFFSET + \
    107				(TPC_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE))
    108#define TPC5_QMAN_BASE_OFFSET	(TPC4_QMAN_BASE_OFFSET + \
    109				(TPC_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE))
    110#define TPC6_QMAN_BASE_OFFSET	(TPC5_QMAN_BASE_OFFSET + \
    111				(TPC_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE))
    112#define TPC7_QMAN_BASE_OFFSET	(TPC6_QMAN_BASE_OFFSET + \
    113				(TPC_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE))
    114
    115#define SRAM_DRIVER_RES_OFFSET	(TPC7_QMAN_BASE_OFFSET + \
    116				(TPC_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE))
    117
    118#if (SRAM_DRIVER_RES_OFFSET >= GOYA_KMD_SRAM_RESERVED_SIZE_FROM_START)
    119#error "MME/TPC QMANs SRAM space exceeds limit"
    120#endif
    121
    122#define SRAM_USER_BASE_OFFSET	GOYA_KMD_SRAM_RESERVED_SIZE_FROM_START
    123
    124/* Virtual address space */
    125#define VA_HOST_SPACE_START	0x1000000000000ull	/* 256TB */
    126#define VA_HOST_SPACE_END	0x3FF8000000000ull	/* 1PB - 1TB */
    127#define VA_HOST_SPACE_SIZE	(VA_HOST_SPACE_END - \
    128					VA_HOST_SPACE_START) /* 767TB */
    129
    130#define VA_DDR_SPACE_START	0x800000000ull		/* 32GB */
    131#define VA_DDR_SPACE_END	0x2000000000ull		/* 128GB */
    132#define VA_DDR_SPACE_SIZE	(VA_DDR_SPACE_END - \
    133					VA_DDR_SPACE_START)	/* 128GB */
    134
    135#if (HL_CPU_ACCESSIBLE_MEM_SIZE != SZ_2M)
    136#error "HL_CPU_ACCESSIBLE_MEM_SIZE must be exactly 2MB to enable MMU mapping"
    137#endif
    138
    139#define VA_CPU_ACCESSIBLE_MEM_ADDR	0x8000000000ull
    140
    141#define DMA_MAX_TRANSFER_SIZE	U32_MAX
    142
    143#define HW_CAP_PLL		0x00000001
    144#define HW_CAP_DDR_0		0x00000002
    145#define HW_CAP_DDR_1		0x00000004
    146#define HW_CAP_MME		0x00000008
    147#define HW_CAP_CPU		0x00000010
    148#define HW_CAP_DMA		0x00000020
    149#define HW_CAP_MSIX		0x00000040
    150#define HW_CAP_CPU_Q		0x00000080
    151#define HW_CAP_MMU		0x00000100
    152#define HW_CAP_TPC_MBIST	0x00000200
    153#define HW_CAP_GOLDEN		0x00000400
    154#define HW_CAP_TPC		0x00000800
    155
    156struct goya_work_freq {
    157	struct hl_device *hdev;
    158	struct delayed_work work_freq;
    159};
    160
    161struct goya_device {
    162	/* TODO: remove hw_queues_lock after moving to scheduler code */
    163	spinlock_t	hw_queues_lock;
    164	struct goya_work_freq	*goya_work;
    165
    166	u64		mme_clk;
    167	u64		tpc_clk;
    168	u64		ic_clk;
    169
    170	u64		ddr_bar_cur_addr;
    171	u32		events_stat[GOYA_ASYNC_EVENT_ID_SIZE];
    172	u32		events_stat_aggregate[GOYA_ASYNC_EVENT_ID_SIZE];
    173	u32		hw_cap_initialized;
    174	u8		device_cpu_mmu_mappings_done;
    175
    176	enum hl_pll_frequency		curr_pll_profile;
    177	enum hl_pm_mng_profile		pm_mng_profile;
    178};
    179
    180int goya_set_fixed_properties(struct hl_device *hdev);
    181int goya_mmu_init(struct hl_device *hdev);
    182void goya_init_dma_qmans(struct hl_device *hdev);
    183void goya_init_mme_qmans(struct hl_device *hdev);
    184void goya_init_tpc_qmans(struct hl_device *hdev);
    185int goya_init_cpu_queues(struct hl_device *hdev);
    186void goya_init_security(struct hl_device *hdev);
    187void goya_ack_protection_bits_errors(struct hl_device *hdev);
    188int goya_late_init(struct hl_device *hdev);
    189void goya_late_fini(struct hl_device *hdev);
    190
    191void goya_ring_doorbell(struct hl_device *hdev, u32 hw_queue_id, u32 pi);
    192void goya_pqe_write(struct hl_device *hdev, __le64 *pqe, struct hl_bd *bd);
    193void goya_update_eq_ci(struct hl_device *hdev, u32 val);
    194void goya_restore_phase_topology(struct hl_device *hdev);
    195int goya_context_switch(struct hl_device *hdev, u32 asid);
    196
    197int goya_debugfs_i2c_read(struct hl_device *hdev, u8 i2c_bus,
    198			u8 i2c_addr, u8 i2c_reg, u32 *val);
    199int goya_debugfs_i2c_write(struct hl_device *hdev, u8 i2c_bus,
    200			u8 i2c_addr, u8 i2c_reg, u32 val);
    201void goya_debugfs_led_set(struct hl_device *hdev, u8 led, u8 state);
    202
    203int goya_test_queue(struct hl_device *hdev, u32 hw_queue_id);
    204int goya_test_queues(struct hl_device *hdev);
    205int goya_test_cpu_queue(struct hl_device *hdev);
    206int goya_send_cpu_message(struct hl_device *hdev, u32 *msg, u16 len,
    207				u32 timeout, u64 *result);
    208
    209long goya_get_temperature(struct hl_device *hdev, int sensor_index, u32 attr);
    210long goya_get_voltage(struct hl_device *hdev, int sensor_index, u32 attr);
    211long goya_get_current(struct hl_device *hdev, int sensor_index, u32 attr);
    212long goya_get_fan_speed(struct hl_device *hdev, int sensor_index, u32 attr);
    213long goya_get_pwm_info(struct hl_device *hdev, int sensor_index, u32 attr);
    214void goya_set_pwm_info(struct hl_device *hdev, int sensor_index, u32 attr,
    215			long value);
    216u64 goya_get_max_power(struct hl_device *hdev);
    217void goya_set_max_power(struct hl_device *hdev, u64 value);
    218
    219void goya_set_pll_profile(struct hl_device *hdev, enum hl_pll_frequency freq);
    220void goya_add_device_attr(struct hl_device *hdev, struct attribute_group *dev_clk_attr_grp,
    221				struct attribute_group *dev_vrm_attr_grp);
    222int goya_cpucp_info_get(struct hl_device *hdev);
    223int goya_debug_coresight(struct hl_device *hdev, struct hl_ctx *ctx, void *data);
    224void goya_halt_coresight(struct hl_device *hdev, struct hl_ctx *ctx);
    225
    226int goya_suspend(struct hl_device *hdev);
    227int goya_resume(struct hl_device *hdev);
    228
    229void goya_handle_eqe(struct hl_device *hdev, struct hl_eq_entry *eq_entry);
    230void *goya_get_events_stat(struct hl_device *hdev, bool aggregate, u32 *size);
    231
    232void goya_add_end_of_cb_packets(struct hl_device *hdev, void *kernel_address,
    233				u32 len, u64 cq_addr, u32 cq_val, u32 msix_vec,
    234				bool eb);
    235int goya_cs_parser(struct hl_device *hdev, struct hl_cs_parser *parser);
    236int goya_scrub_device_mem(struct hl_device *hdev, u64 addr, u64 size);
    237void *goya_get_int_queue_base(struct hl_device *hdev, u32 queue_id,
    238				dma_addr_t *dma_handle,	u16 *queue_len);
    239u32 goya_get_dma_desc_list_size(struct hl_device *hdev, struct sg_table *sgt);
    240int goya_send_heartbeat(struct hl_device *hdev);
    241void *goya_cpu_accessible_dma_pool_alloc(struct hl_device *hdev, size_t size,
    242					dma_addr_t *dma_handle);
    243void goya_cpu_accessible_dma_pool_free(struct hl_device *hdev, size_t size,
    244					void *vaddr);
    245void goya_mmu_remove_device_cpu_mappings(struct hl_device *hdev);
    246
    247u32 goya_get_queue_id_for_cq(struct hl_device *hdev, u32 cq_idx);
    248u64 goya_get_device_time(struct hl_device *hdev);
    249int goya_set_frequency(struct hl_device *hdev, enum hl_pll_frequency freq);
    250
    251#endif /* GOYAP_H_ */