working parser tm

This commit is contained in:
Maieul BOYER 2024-06-30 18:32:35 +02:00
parent 8d192a0abc
commit 2d88b6af25
No known key found for this signature in database
51 changed files with 33 additions and 31734 deletions

View file

@ -1,50 +1,46 @@
#ifndef TREE_SITTER_UNICODE_H_
#define TREE_SITTER_UNICODE_H_
#ifdef __cplusplus
extern "C" {
#endif
#include <limits.h>
#include <stdint.h>
#include <stdio.h>
#define U_EXPORT
#define U_EXPORT2
#include "unicode/utf8.h"
#include "unicode/utf16.h"
#include "unicode/utf8.h"
static const int32_t TS_DECODE_ERROR = U_SENTINEL;
// These functions read one unicode code point from the given string,
// returning the number of bytes consumed.
typedef uint32_t (*UnicodeDecodeFunction)(
const uint8_t *string,
uint32_t length,
int32_t *code_point
);
typedef uint32_t (*UnicodeDecodeFunction)(const uint8_t *string, uint32_t length, int32_t *code_point);
static inline uint32_t ts_decode_utf8(
const uint8_t *string,
uint32_t length,
int32_t *code_point
) {
uint32_t i = 0;
U8_NEXT(string, i, length, *code_point);
return i;
static inline uint32_t ts_decode_ascii(const uint8_t *string, uint32_t length, int32_t *code_point)
{
(void)(length);
*code_point = 0;
*(uint8_t *)code_point = *string;
return (1);
}
static inline uint32_t ts_decode_utf16(
const uint8_t *string,
uint32_t length,
int32_t *code_point
) {
uint32_t i = 0;
U16_NEXT(((uint16_t *)string), i, length, *code_point);
return i * 2;
static inline uint32_t ts_decode_utf8(const uint8_t *string, uint32_t length, int32_t *code_point)
{
return (ts_decode_ascii(string, length, code_point));
/*
uint32_t i = 0;
U8_NEXT(string, i, length, *code_point);
printf("[UTF8]read %i bytes\n", i);
return i;
*/
}
#ifdef __cplusplus
static inline uint32_t ts_decode_utf16(const uint8_t *string, uint32_t length, int32_t *code_point)
{
uint32_t i = 0;
U16_NEXT(((uint16_t *)string), i, length, *code_point);
printf("[UTF16]read %i bytes\n", i);
return i * 2;
}
#endif
#endif // TREE_SITTER_UNICODE_H_
#endif // TREE_SITTER_UNICODE_H_