Outline
#include "freertos/FreeRTOS.h"
#include "freertos/task.h"
#include "esp_psram.h"
#include "esp_private/esp_psram_extram.h"
#include "esp32/rom/cache.h"
#include "sdkconfig.h"
#include "esp32/himem.h"
#include "soc/soc.h"
#include "esp_log.h"
#include "esp_check.h"
#include "../esp_psram_impl.h"
#define SPIRAM_BANKSWITCH_RESERVE
#define CACHE_BLOCKSIZE
#define VIRT_HIMEM_RANGE_START
#define VIRT_HIMEM_RANGE_BLOCKSTART
#define PHYS_HIMEM_BLOCKSTART
#define TAG
ramblock_t
rangeblock_t
s_ram_descriptor
s_range_descriptor
s_ramblockcnt
s_rangeblockcnt
esp_himem_rangedata_t
esp_himem_ramdata_t
spinlock
ramblock_idx_valid(int)
rangeblock_idx_valid(int)
set_bank(int, int, int)
esp_himem_get_phys_size()
esp_himem_get_free_size()
esp_himem_reserved_area_size()
esp_himem_init()
allocate_blocks(int, uint16_t *)
esp_himem_alloc(size_t, esp_himem_handle_t *)
esp_himem_free(esp_himem_handle_t)
esp_himem_alloc_map_range(size_t, esp_himem_rangehandle_t *)
esp_himem_free_map_range(esp_himem_rangehandle_t)
esp_himem_map(esp_himem_handle_t, esp_himem_rangehandle_t, size_t, size_t, size_t, int, void **)
esp_himem_unmap(esp_himem_rangehandle_t, void *, size_t)
File: ESP-IDF components/esp_psram/esp32/esp_himem.c

/*
 * SPDX-FileCopyrightText: 2018-2024 Espressif Systems (Shanghai) CO LTD
 *
 * SPDX-License-Identifier: Apache-2.0
 */

#include "freertos/FreeRTOS.h"
#include "freertos/task.h"
#include "esp_psram.h"
#include "esp_private/esp_psram_extram.h"
#include "esp32/rom/cache.h"
#include "sdkconfig.h"
#include "esp32/himem.h"
#include "soc/soc.h"
#include "esp_log.h"
#include "esp_check.h"
#include "../esp_psram_impl.h"

/*
So, why does the API look this way and is so inflexible to not allow any maps beyond the full 32K chunks? Most of
it has to do with the fact that the cache works on the *virtual* addresses. What this comes down to is that while
it's allowed to map a range of physical memory into the address space two times, there's no cache consistency
between the two regions.

This means that a write to region A may or may not show up, perhaps delayed, in region B, as it depends on the time
that the writeback to SPI RAM is done on A and the time before the corresponding cache line is invalidated on B.
Note that this goes for every 32-byte cache line: this implies that if a program writes to address X and Y within A,
the write to Y may show up before the write to X does.

It gets even worse when both A and B are written: theoretically, a write to a 32-byte cache line in A can be
entirely undone because of a write to a different address in B that happens to be in the same 32-byte cache line.

Because of these reasons, we do not allow double mappings at all. This, however, has other implications that make
supporting ranges not really useful. Because of the lack of double mappings, applications will need to do their own
management of mapped regions, meaning they will normally map in and out blocks at a time anyway, as mapping more
fluent regions would result in the chance of accidentally mapping two overlapping regions. As this is the case, to
keep the code simple, at the moment we just force these blocks to be equal to the 32K MMU page size. The API itself
does allow for more granular allocations, so if there's a pressing need for a more complex solution in the future,
we can do this.

Note: In the future, we can expand on this api to do a memcpy() between SPI RAM and (internal) memory using the
SPI1 peripheral. This needs support for SPI1 to be in the SPI driver, however.
*/

#if CONFIG_SPIRAM_BANKSWITCH_ENABLE
#define SPIRAM_BANKSWITCH_RESERVE CONFIG_SPIRAM_BANKSWITCH_RESERVE
#else
#define SPIRAM_BANKSWITCH_RESERVE 0
#endif

#define CACHE_BLOCKSIZE (32*1024)

//Start of the virtual address range reserved for himem use
#define VIRT_HIMEM_RANGE_START (SOC_EXTRAM_DATA_LOW+(128-SPIRAM_BANKSWITCH_RESERVE)*CACHE_BLOCKSIZE)
//Start MMU block reserved for himem use
#define VIRT_HIMEM_RANGE_BLOCKSTART (128-SPIRAM_BANKSWITCH_RESERVE)
//Start physical block
#define PHYS_HIMEM_BLOCKSTART (128-SPIRAM_BANKSWITCH_RESERVE)

#define TAG "esp_himem"

// Metadata for a block of physical RAM
typedef struct {
    unsigned int is_alloced: 1;
    unsigned int is_mapped: 1;
} ramblock_t;

//Metadata for a 32-K memory address range
typedef struct {
    unsigned int is_alloced: 1;
    unsigned int is_mapped: 1;
    unsigned int ram_block: 16;
} rangeblock_t;

static ramblock_t *s_ram_descriptor = NULL;
static rangeblock_t *s_range_descriptor = NULL;
static int s_ramblockcnt = 0;
static const int s_rangeblockcnt = SPIRAM_BANKSWITCH_RESERVE;

//Handle for a window of address space
typedef struct esp_himem_rangedata_t {
    int block_ct;
    int block_start;
} esp_himem_rangedata_t;

//Handle for a range of physical memory
typedef struct esp_himem_ramdata_t {
    int block_ct;
    uint16_t *block;
} esp_himem_ramdata_t;

static portMUX_TYPE spinlock = portMUX_INITIALIZER_UNLOCKED;

static inline int ramblock_idx_valid(int ramblock_idx)
{
    return (ramblock_idx >= 0 && ramblock_idx < s_ramblockcnt);
}

static inline int rangeblock_idx_valid(int rangeblock_idx)
{
    return (rangeblock_idx >= 0 && rangeblock_idx < s_rangeblockcnt);
}

static void set_bank(int virt_bank, int phys_bank, int ct)
{
    int r __attribute__((unused));
    r = cache_sram_mmu_set(0, 0, SOC_EXTRAM_DATA_LOW + CACHE_BLOCKSIZE * virt_bank, phys_bank * CACHE_BLOCKSIZE, 32, ct);
    assert(r == 0);
    r = cache_sram_mmu_set(1, 0, SOC_EXTRAM_DATA_LOW + CACHE_BLOCKSIZE * virt_bank, phys_bank * CACHE_BLOCKSIZE, 32, ct);
    assert(r == 0);
}

size_t esp_himem_get_phys_size(void)
{
    int paddr_start = (4096 * 1024) - (CACHE_BLOCKSIZE * SPIRAM_BANKSWITCH_RESERVE);
    uint32_t psram_available_size = 0;
    esp_psram_impl_get_available_size(&psram_available_size);
    return psram_available_size - paddr_start;
}

size_t esp_himem_get_free_size(void)
{
    size_t ret = 0;
    for (int i = 0; i < s_ramblockcnt; i++) {
        if (!s_ram_descriptor[i].is_alloced) {
            ret += CACHE_BLOCKSIZE;
        }
    }
    return ret;
}

size_t esp_himem_reserved_area_size(void)
{
    return CACHE_BLOCKSIZE * SPIRAM_BANKSWITCH_RESERVE;
}

#if SPIRAM_BANKSWITCH_RESERVE > 0
void __attribute__((constructor)) esp_himem_init(void)
{
    uint32_t maxram = 0;
    esp_psram_impl_get_available_size(&maxram);
    //catch double init
    ESP_RETURN_ON_FALSE(s_ram_descriptor == NULL,, TAG, "already initialized"); //Looks weird; last arg is empty so it expands to 'return ;'
    ESP_RETURN_ON_FALSE(s_range_descriptor == NULL,, TAG, "already initialized");
    //need to have some reserved banks
    ESP_RETURN_ON_FALSE(SPIRAM_BANKSWITCH_RESERVE != 0,, TAG, "No banks reserved for himem");
    //Start and end of physical reserved memory. Note it starts slightly under
    //the 4MiB mark as the reserved banks can't have a unity mapping to be used by malloc
    //anymore; we treat them as himem instead.
    int paddr_start = (4096 * 1024) - (CACHE_BLOCKSIZE * SPIRAM_BANKSWITCH_RESERVE);
    int paddr_end = maxram;
    s_ramblockcnt = ((paddr_end - paddr_start) / CACHE_BLOCKSIZE);
    //Allocate data structures
    s_ram_descriptor = calloc(s_ramblockcnt, sizeof(ramblock_t));
    s_range_descriptor = calloc(SPIRAM_BANKSWITCH_RESERVE, sizeof(rangeblock_t));
    if (s_ram_descriptor == NULL || s_range_descriptor == NULL) {
        ESP_EARLY_LOGE(TAG, "Cannot allocate memory for meta info. Not initializing!");
        free(s_ram_descriptor);
        free(s_range_descriptor);
        return;
    }
    ESP_EARLY_LOGI(TAG, "Initialized. Using last %d 32KB address blocks for bank switching on %d KB of physical memory.",
                   SPIRAM_BANKSWITCH_RESERVE, (paddr_end - paddr_start) / 1024);
}
#endif

//Allocate count not-necessarily consecutive physical RAM blocks, return numbers in blocks[]. Return
//true if blocks can be allocated, false if not.
static bool allocate_blocks(int count, uint16_t *blocks_out)
{
    int n = 0;
    for (int i = 0; i < s_ramblockcnt && n != count; i++) {
        if (!s_ram_descriptor[i].is_alloced) {
            blocks_out[n] = i;
            n++;
        }
    }
    if (n == count) {
        //All blocks could be allocated. Mark as in use.
        for (int i = 0; i < count; i++) {
            s_ram_descriptor[blocks_out[i]].is_alloced = true;
            assert(s_ram_descriptor[blocks_out[i]].is_mapped == false);
        }
        return true;
    } else {
        //Error allocating blocks
        return false;
    }
}

esp_err_t esp_himem_alloc(size_t size, esp_himem_handle_t *handle_out)
{
    if (size % CACHE_BLOCKSIZE != 0) {
        return ESP_ERR_INVALID_SIZE;
    }
    int blocks = size / CACHE_BLOCKSIZE;
    esp_himem_ramdata_t *r = calloc(1, sizeof(esp_himem_ramdata_t));
    if (!r) {
        goto nomem;
    }
    r->block = calloc(blocks, sizeof(uint16_t));
    if (!r->block) {
        goto nomem;
    }
    portENTER_CRITICAL(&spinlock);
    int ok = allocate_blocks(blocks, r->block);
    portEXIT_CRITICAL(&spinlock);
    if (!ok) {
        goto nomem;
    }
    r->block_ct = blocks;
    *handle_out = r;
    return ESP_OK;
nomem:
    if (r) {
        free(r->block);
    }
    free(r);
    return ESP_ERR_NO_MEM;
}

esp_err_t esp_himem_free(esp_himem_handle_t handle)
{
    //Check if any of the blocks is still mapped; fail if this is the case.
    for (int i = 0; i < handle->block_ct; i++) {
        assert(ramblock_idx_valid(handle->block[i]));
        ESP_RETURN_ON_FALSE(!s_ram_descriptor[handle->block[i]].is_mapped, ESP_ERR_INVALID_ARG, TAG, "block in range still mapped");
    }
    //Mark blocks as free
    portENTER_CRITICAL(&spinlock);
    for (int i = 0; i < handle->block_ct; i++) {
        s_ram_descriptor[handle->block[i]].is_alloced = false;
    }
    portEXIT_CRITICAL(&spinlock);
    //Free handle
    free(handle->block);
    free(handle);
    return ESP_OK;
}

esp_err_t esp_himem_alloc_map_range(size_t size, esp_himem_rangehandle_t *handle_out)
{
    ESP_RETURN_ON_FALSE(s_ram_descriptor != NULL, ESP_ERR_INVALID_STATE, TAG, "Himem not available!");
    ESP_RETURN_ON_FALSE(size % CACHE_BLOCKSIZE == 0, ESP_ERR_INVALID_SIZE, TAG, "requested size not aligned to blocksize");
    int blocks = size / CACHE_BLOCKSIZE;
    esp_himem_rangedata_t *r = calloc(1, sizeof(esp_himem_rangedata_t));
    if (!r) {
        return ESP_ERR_NO_MEM;
    }
    r->block_ct = blocks;
    r->block_start = -1;
    int start_free = 0;
    portENTER_CRITICAL(&spinlock);
    for (int i = 0; i < s_rangeblockcnt; i++) {
        if (s_range_descriptor[i].is_alloced) {
            start_free = i + 1; //optimistically assume next block is free...
        } else if (i - start_free == blocks - 1) {
            //We found a span of blocks that's big enough to allocate the requested range in.
            r->block_start = start_free;
            break;
        }
    }
    if (r->block_start == -1) {
        //Couldn't find enough free blocks
        free(r);
        portEXIT_CRITICAL(&spinlock);
        return ESP_ERR_NO_MEM;
    }
    //Range is found. Mark the blocks as in use.
    for (int i = 0; i < blocks; i++) {
        s_range_descriptor[r->block_start + i].is_alloced = 1;
    }
    portEXIT_CRITICAL(&spinlock);
    //All done.
    *handle_out = r;
    return ESP_OK;
}

esp_err_t esp_himem_free_map_range(esp_himem_rangehandle_t handle)
{
    //Check if any of the blocks in the range have a mapping
    for (int i = 0; i < handle->block_ct; i++) {
        assert(rangeblock_idx_valid(handle->block_start + i));
        assert(s_range_descriptor[i + handle->block_start].is_alloced == 1); //should be, if handle is valid
        ESP_RETURN_ON_FALSE(!s_range_descriptor[i + handle->block_start].is_mapped, ESP_ERR_INVALID_ARG, TAG, "memory still mapped to range");
    }
    //We should be good to free this. Mark blocks as free.
    portENTER_CRITICAL(&spinlock);
    for (int i = 0; i < handle->block_ct; i++) {
        s_range_descriptor[i + handle->block_start].is_alloced = 0;
    }
    portEXIT_CRITICAL(&spinlock);
    free(handle);
    return ESP_OK;
}

esp_err_t esp_himem_map(esp_himem_handle_t handle, esp_himem_rangehandle_t range, size_t ram_offset, size_t range_offset, size_t len, int flags, void **out_ptr)
{
    int ram_block = ram_offset / CACHE_BLOCKSIZE;
    int range_block = range_offset / CACHE_BLOCKSIZE;
    int blockcount = len / CACHE_BLOCKSIZE;
    ESP_RETURN_ON_FALSE(s_ram_descriptor != NULL, ESP_ERR_INVALID_STATE, TAG, "Himem not available!");
    //Offsets and length must be block-aligned
    ESP_RETURN_ON_FALSE(ram_offset % CACHE_BLOCKSIZE == 0, ESP_ERR_INVALID_ARG, TAG, "ram offset not aligned to blocksize");
    ESP_RETURN_ON_FALSE(range_offset % CACHE_BLOCKSIZE == 0, ESP_ERR_INVALID_ARG, TAG, "range not aligned to blocksize");
    ESP_RETURN_ON_FALSE(len % CACHE_BLOCKSIZE == 0, ESP_ERR_INVALID_ARG, TAG, "length not aligned to blocksize");
    //ram and range should be within allocated range
    ESP_RETURN_ON_FALSE(ram_block + blockcount <= handle->block_ct, ESP_ERR_INVALID_SIZE, TAG, "args not in range of phys ram handle");
    ESP_RETURN_ON_FALSE(range_block + blockcount <= range->block_ct, ESP_ERR_INVALID_SIZE, TAG, "args not in range of range handle");
    //Check if ram blocks aren't already mapped, and if memory range is unmapped
    for (int i = 0; i < blockcount; i++) {
        ESP_RETURN_ON_FALSE(!s_ram_descriptor[handle->block[i + ram_block]].is_mapped, ESP_ERR_INVALID_STATE, TAG, "ram already mapped");
        ESP_RETURN_ON_FALSE(!s_range_descriptor[range->block_start + i + range_block].is_mapped, ESP_ERR_INVALID_STATE, TAG, "range already mapped");
    }
    //Map and mark as mapped
    portENTER_CRITICAL(&spinlock);
    for (int i = 0; i < blockcount; i++) {
        assert(ramblock_idx_valid(handle->block[i + ram_block]));
        s_ram_descriptor[handle->block[i + ram_block]].is_mapped = 1;
        s_range_descriptor[range->block_start + i + range_block].is_mapped = 1;
        s_range_descriptor[range->block_start + i + range_block].ram_block = handle->block[i + ram_block];
    }
    portEXIT_CRITICAL(&spinlock);
    for (int i = 0; i < blockcount; i++) {
        set_bank(VIRT_HIMEM_RANGE_BLOCKSTART + range->block_start + i + range_block, handle->block[i + ram_block] + PHYS_HIMEM_BLOCKSTART, 1);
    }
    //Set out pointer
    *out_ptr = (void *)(VIRT_HIMEM_RANGE_START + (range->block_start + range_block) * CACHE_BLOCKSIZE);
    return ESP_OK;
}

esp_err_t esp_himem_unmap(esp_himem_rangehandle_t range, void *ptr, size_t len)
{
    //Note: doesn't actually unmap, just clears cache and marks blocks as unmapped.
    //Future optimization: could actually lazy-unmap here: essentially, do nothing and only clear the cache when we reuse
    //the block for a different physical address.
    int range_offset = (uint32_t)ptr - VIRT_HIMEM_RANGE_START;
    int range_block = (range_offset / CACHE_BLOCKSIZE) - range->block_start;
    int blockcount = len / CACHE_BLOCKSIZE;
    ESP_RETURN_ON_FALSE(range_offset % CACHE_BLOCKSIZE == 0, ESP_ERR_INVALID_ARG, TAG, "range offset not block-aligned");
    ESP_RETURN_ON_FALSE(len % CACHE_BLOCKSIZE == 0, ESP_ERR_INVALID_ARG, TAG, "map length not block-aligned");
    ESP_RETURN_ON_FALSE(range_block + blockcount <= range->block_ct, ESP_ERR_INVALID_ARG, TAG, "range out of bounds for handle");
    portENTER_CRITICAL(&spinlock);
    for (int i = 0; i < blockcount; i++) {
        int ramblock = s_range_descriptor[range->block_start + i + range_block].ram_block;
        assert(ramblock_idx_valid(ramblock));
        s_ram_descriptor[ramblock].is_mapped = 0;
        s_range_descriptor[range->block_start + i + range_block].is_mapped = 0;
    }
    esp_psram_extram_writeback_cache();
    portEXIT_CRITICAL(&spinlock);
    return ESP_OK;
}
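
For orientation, here is a minimal sketch of how an application might drive this API end to end. It is illustrative only and assumes CONFIG_SPIRAM_BANKSWITCH_ENABLE is set in menuconfig so that esp_himem_init() has reserved banks; the helper name example_fill_himem and the EXAMPLE_BLOCK constant are made up for the example, while the esp_himem_* calls and ESP_ERROR_CHECK are the ESP-IDF APIs shown above. Because double mappings are disallowed (see the header comment), the loop maps one 32 KB block into a single reusable window, touches it, and unmaps it before moving on.

#include <string.h>
#include "esp_err.h"
#include "esp32/himem.h"

// Illustrative constant; mirrors CACHE_BLOCKSIZE (32 KB) used throughout this file.
#define EXAMPLE_BLOCK (32 * 1024)

// Hypothetical helper: fill all available himem, one 32 KB window at a time.
static esp_err_t example_fill_himem(void)
{
    esp_himem_handle_t mem;        // physical PSRAM blocks
    esp_himem_rangehandle_t range; // window of virtual address space
    size_t size = esp_himem_get_free_size();

    // Allocate physical blocks and one block-sized mapping window.
    ESP_ERROR_CHECK(esp_himem_alloc(size, &mem));
    ESP_ERROR_CHECK(esp_himem_alloc_map_range(EXAMPLE_BLOCK, &range));

    for (size_t off = 0; off < size; off += EXAMPLE_BLOCK) {
        void *ptr;
        // Map one physical block into the window, use it, then unmap it
        // so the next block can reuse the same virtual range.
        ESP_ERROR_CHECK(esp_himem_map(mem, range, off, 0, EXAMPLE_BLOCK, 0, &ptr));
        memset(ptr, 0xA5, EXAMPLE_BLOCK);
        ESP_ERROR_CHECK(esp_himem_unmap(range, ptr, EXAMPLE_BLOCK));
    }

    // Release the window and the physical blocks (blocks must be unmapped first).
    ESP_ERROR_CHECK(esp_himem_free_map_range(range));
    ESP_ERROR_CHECK(esp_himem_free(mem));
    return ESP_OK;
}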