load.c
author viric@mandarina
Sat, 08 Sep 2007 09:13:15 +0200
changeset 29 84abeba4ef3b
parent 6 bc41369f4587
permissions -rw-r--r--
Removing binary.
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
0
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
     1
#include <stdio.h>
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
     2
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
     3
#include "dictre.h"
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
     4
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
     5
enum
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
     6
{
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
     7
    MAX=500000
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
     8
};
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
     9
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    10
struct Word words[MAX];
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    11
int nwords;
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    12
struct Def defs[MAX];
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    13
int ndefs;
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    14
int dont_touch[20];
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    15
int ndont_touch;
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    16
5
c87681fff7d3 Checks for repeated definitions.
viric@mandarina
parents: 2
diff changeset
    17
void init_load()
0
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    18
{
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    19
    ndefs = 0;
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    20
    nwords = 0;
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    21
    ndont_touch = 0;
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    22
}
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    23
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    24
static void new_word(struct Word *from)
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    25
{
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    26
    memcpy(&words[nwords], from, sizeof(*from));
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    27
    nwords++;
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    28
}
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    29
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    30
static void new_dont_touch(int n)
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    31
{
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    32
    dont_touch[ndont_touch++] = n;
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    33
}
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    34
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    35
static int new_def(char *def, int offset, int length)
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    36
{
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    37
    defs[ndefs].d = def;
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    38
    defs[ndefs].offset = offset;
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    39
    defs[ndefs].length = length;
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    40
    return ndefs++;
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    41
}
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    42
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    43
static int search_def(int offset, int length)
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    44
{
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    45
    int i;
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    46
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    47
    for(i=0; i < ndefs; ++i)
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    48
    {
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    49
        if (defs[i].offset == offset &&
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    50
                defs[i].length == length)
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    51
            return i;
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    52
    }
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    53
    return -1;
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    54
}
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    55
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    56
static void print_word(struct Word *w)
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    57
{
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    58
    printf("%s\t%i\n", w->w, w->def);
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    59
}
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    60
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    61
void load_dictionary(FILE *index, FILE *fdefs)
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    62
{
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    63
    struct Word w;
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    64
    int last_offset = 0;
5
c87681fff7d3 Checks for repeated definitions.
viric@mandarina
parents: 2
diff changeset
    65
    int def_avoided = 0;
6
bc41369f4587 Fixed things in replace.
viric@mandarina
parents: 5
diff changeset
    66
    int numword = 0;;
bc41369f4587 Fixed things in replace.
viric@mandarina
parents: 5
diff changeset
    67
    static int dispnwords = 0;
0
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    68
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    69
    do {
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    70
        int offset, length;
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    71
        char *defstr;
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    72
        w.w = get_word(index);
6
bc41369f4587 Fixed things in replace.
viric@mandarina
parents: 5
diff changeset
    73
        /*numword++;
bc41369f4587 Fixed things in replace.
viric@mandarina
parents: 5
diff changeset
    74
        printf("words: %i\n", numword);*/
0
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    75
        if (w.w == 0)
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    76
            break;
5
c87681fff7d3 Checks for repeated definitions.
viric@mandarina
parents: 2
diff changeset
    77
        /*printf("Word: %s\n", w.w);*/
0
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    78
        offset = get_int(index);
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    79
        length = get_int(index);
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    80
        if (offset > last_offset)
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    81
        {
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    82
            w.def = -1;
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    83
            last_offset = offset;
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    84
        }
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    85
        else
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    86
            w.def = search_def(offset, length);
5
c87681fff7d3 Checks for repeated definitions.
viric@mandarina
parents: 2
diff changeset
    87
        if (w.def == -1) 
0
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    88
        {
5
c87681fff7d3 Checks for repeated definitions.
viric@mandarina
parents: 2
diff changeset
    89
            /* New definition */
c87681fff7d3 Checks for repeated definitions.
viric@mandarina
parents: 2
diff changeset
    90
            int newindex, repindex;
0
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
    91
            defstr = get_def(fdefs, offset, length);
5
c87681fff7d3 Checks for repeated definitions.
viric@mandarina
parents: 2
diff changeset
    92
            newindex = new_def(defstr, offset, length);
6
bc41369f4587 Fixed things in replace.
viric@mandarina
parents: 5
diff changeset
    93
            /*
bc41369f4587 Fixed things in replace.
viric@mandarina
parents: 5
diff changeset
    94
            printf("Length %i (%s): %i\n", newindex, w.w, length);
bc41369f4587 Fixed things in replace.
viric@mandarina
parents: 5
diff changeset
    95
            */
5
c87681fff7d3 Checks for repeated definitions.
viric@mandarina
parents: 2
diff changeset
    96
            
c87681fff7d3 Checks for repeated definitions.
viric@mandarina
parents: 2
diff changeset
    97
            /* Store it in the hash for repeated defs */
c87681fff7d3 Checks for repeated definitions.
viric@mandarina
parents: 2
diff changeset
    98
            repindex = def_repeated(&defs[newindex]);
c87681fff7d3 Checks for repeated definitions.
viric@mandarina
parents: 2
diff changeset
    99
            if (repindex != -1) 
c87681fff7d3 Checks for repeated definitions.
viric@mandarina
parents: 2
diff changeset
   100
            {
c87681fff7d3 Checks for repeated definitions.
viric@mandarina
parents: 2
diff changeset
   101
                def_avoided += 1;
6
bc41369f4587 Fixed things in replace.
viric@mandarina
parents: 5
diff changeset
   102
                /*
bc41369f4587 Fixed things in replace.
viric@mandarina
parents: 5
diff changeset
   103
                printf("Repeated def avoided %i (for def %i)"
bc41369f4587 Fixed things in replace.
viric@mandarina
parents: 5
diff changeset
   104
                        " (%s)\n%i %s\n%i %s\n",
bc41369f4587 Fixed things in replace.
viric@mandarina
parents: 5
diff changeset
   105
                        def_avoided, repindex, w.w,
bc41369f4587 Fixed things in replace.
viric@mandarina
parents: 5
diff changeset
   106
                        length, defstr,
bc41369f4587 Fixed things in replace.
viric@mandarina
parents: 5
diff changeset
   107
                        defs[repindex].length, defs[repindex].d);
bc41369f4587 Fixed things in replace.
viric@mandarina
parents: 5
diff changeset
   108
                        */
5
c87681fff7d3 Checks for repeated definitions.
viric@mandarina
parents: 2
diff changeset
   109
                remove_def(newindex);
c87681fff7d3 Checks for repeated definitions.
viric@mandarina
parents: 2
diff changeset
   110
                newindex = repindex;
c87681fff7d3 Checks for repeated definitions.
viric@mandarina
parents: 2
diff changeset
   111
            } else
c87681fff7d3 Checks for repeated definitions.
viric@mandarina
parents: 2
diff changeset
   112
                new_hashdef(&defs[newindex], newindex);
c87681fff7d3 Checks for repeated definitions.
viric@mandarina
parents: 2
diff changeset
   113
c87681fff7d3 Checks for repeated definitions.
viric@mandarina
parents: 2
diff changeset
   114
            /* Store the final index */
c87681fff7d3 Checks for repeated definitions.
viric@mandarina
parents: 2
diff changeset
   115
            w.def = newindex;
0
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
   116
        }
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
   117
        /* sizeof -1  instead of strlen() */
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
   118
        if (strncmp(w.w, "00database", sizeof("00database") - 1) == 0)
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
   119
                new_dont_touch(w.def);
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
   120
        new_word(&w);
6
bc41369f4587 Fixed things in replace.
viric@mandarina
parents: 5
diff changeset
   121
bc41369f4587 Fixed things in replace.
viric@mandarina
parents: 5
diff changeset
   122
        /* stdout Display */
bc41369f4587 Fixed things in replace.
viric@mandarina
parents: 5
diff changeset
   123
        dispnwords++;
bc41369f4587 Fixed things in replace.
viric@mandarina
parents: 5
diff changeset
   124
        if (dispnwords >= 1000)
bc41369f4587 Fixed things in replace.
viric@mandarina
parents: 5
diff changeset
   125
        {
bc41369f4587 Fixed things in replace.
viric@mandarina
parents: 5
diff changeset
   126
            dispnwords = 0;
bc41369f4587 Fixed things in replace.
viric@mandarina
parents: 5
diff changeset
   127
            printf("Loaded: %i Repeated definitions avoided: %i\n", nwords,
bc41369f4587 Fixed things in replace.
viric@mandarina
parents: 5
diff changeset
   128
                    def_avoided);
bc41369f4587 Fixed things in replace.
viric@mandarina
parents: 5
diff changeset
   129
        }
bc41369f4587 Fixed things in replace.
viric@mandarina
parents: 5
diff changeset
   130
0
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
   131
    } while(1);
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
   132
}
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
   133
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
   134
void print_words()
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
   135
{
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
   136
    int i;
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
   137
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
   138
    for(i=0; i < nwords; ++i)
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
   139
        print_word(&words[i]);
7f37716d4f1e Initial. Awful makefile.
viric@llimona
parents:
diff changeset
   140
}