implemented a lot of stuff

2025-07-21 13:34:20 +03:00
parent 5182a631c1
commit da3367de3f
1 changed files with 69 additions and 14 deletions
--- a/lexer.c
+++ b/lexer.c
@@ -24,14 +24,24 @@ typedef enum{
  TOKEN_MINUS,
  TOKEN_INTEGER,
  TOKEN_SPACE,
  TOKEN_STRING,
  intdef,
  TOKEN_UNKNOWN,
 } symbols;
 typedef enum{
  BHV_STACK,
  BHV_UNDEFINED,
  BHV_NUMBER,
  BHV_STRING,
 } symbol_bhv;
 typedef struct{
  symbols type;
  char* text;
  size_t text_len;
  symbol_bhv behaviour;
  uint cursor_skip;
 } Token;
 typedef struct{
@@ -53,8 +63,12 @@ void lexer_next(Lexer *mylexer){
 Token read_from_tok(char* text, uint cursor){ 
    Token mytoks;
    static char buf[64];
    size_t i = 0;
    mytoks.cursor_skip = 1;
    if (isdigit(text[cursor])) {
        size_t start = cursor;
        while (isdigit(text[cursor])) {
@@ -62,9 +76,23 @@ Token read_from_tok(char* text, uint cursor){
        }
        buf[i] = '\0';
        mytoks.type = TOKEN_INTEGER;
        mytoks.behaviour = BHV_NUMBER;
        mytoks.cursor_skip = cursor - start;
        mytoks.text = buf;
        mytoks.text_len = i;
    } else if (isalpha(text[cursor])){
        size_t start = cursor;
        while (isalpha(text[cursor])) {
            buf[i++] = text[cursor++];
        }
        buf[i] = '\0';
        mytoks.type = TOKEN_STRING;
        mytoks.behaviour = BHV_STRING; 
        mytoks.cursor_skip = cursor - start;
        mytoks.text = buf;
        mytoks.text_len = i;
    }
    else {
       buf[0] = text[cursor];
       buf[1] = '\0';
@@ -73,12 +101,14 @@ Token read_from_tok(char* text, uint cursor){
       switch (text[cursor]){
         case '+':
           mytoks.type = TOKEN_PLUS;
-         // asigning text is not really needed unless for debug
+         // asigning text is not really needed unless for debug. could however be useful for codegen later.
           mytoks.text = "+";
           mytoks.behaviour = BHV_STACK;
                      break;
         case '-':
           mytoks.type = TOKEN_MINUS;
           mytoks.text = "-";
           mytoks.behaviour = BHV_STACK; 
           break;
         case ' ':
           mytoks.type = TOKEN_SPACE;
@@ -86,6 +116,8 @@ Token read_from_tok(char* text, uint cursor){
           break;
         default:
           mytoks.type = TOKEN_UNKNOWN;
           mytoks.behaviour = BHV_UNDEFINED;
    } 
  }
  return mytoks;
@@ -94,22 +126,45 @@ Token read_from_tok(char* text, uint cursor){
 // Token* c
 void parser(Token mytok, char* input){
  int length1 = strlen(input);
  int i=0;
  while (i < length1) {
  mytok = read_from_tok(input, i);
  printf("Text: %s\n", mytok.text);
  printf("Behaviour: %d\n", mytok.behaviour);
      if (mytok.behaviour == BHV_STACK){
         printf("this is stack lil bro\n");
      }
    i++;
  }
 }
 // operators accepted in int/digit or whatever type def only when they have a digit before AND after them 
 /*
 int main(){
  Token newtok;
-  char* input = "32323 + 232";
+  char* input = "8";
  parser(newtok, input);
 }
 */
 int main(){
    Token newtok;
    char* input = "32323 + Hello world";
    int length1 = strlen(input);
    int i = 0;
    while (i < length1) {
        Token result = read_from_tok(input, i);
        printf("text: %s\ntype: %u\n\n", result.text, result.type);
-    if (result.type == TOKEN_INTEGER) {
+        i += result.cursor_skip; 
        i += result.text_len; // to skip the whole integer
    } else {
      i++;
    }
    }
 }