Add final state from 2018-10-07
[enwiki-links-graph.git] / links-outgoing-to-incoming.c
diff --git a/links-outgoing-to-incoming.c b/links-outgoing-to-incoming.c
new file mode 100644 (file)
index 0000000..8a23ca7
--- /dev/null
@@ -0,0 +1,89 @@
+#include <assert.h>
+#include <ctype.h>
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+
+
+
+int main()
+{
+       FILE *in_file;
+       FILE *out_file;
+
+       size_t titles;
+
+       size_t **linko;
+       size_t *linkos;
+
+       size_t **linki;
+       size_t *linkis;
+
+       size_t link_titles_done = 0;
+
+       size_t i;
+
+
+       /*
+        * Read all outgoing links into memory
+        */
+
+       in_file = fopen("links-outgoing.bin", "rb");
+
+       fread(&titles, sizeof(titles), 1, in_file);
+
+       linko = malloc(titles * sizeof(size_t*));
+       linkos = malloc(titles * sizeof(size_t));
+
+       for (i = 0; i < titles; i++) {
+               size_t j;
+
+               fread(&linkos[i], sizeof(linkos[i]), 1, in_file);
+
+               linko[i] = malloc(linkos[i] * sizeof(linko[i][0]));
+
+               for (j = 0; j < linkos[i]; j++) {
+                       fread(&linko[i][j], sizeof(linko[i][j]), 1, in_file);
+               }
+       }
+       fclose(in_file);
+
+       printf("Outgoing links read.\n");
+
+
+
+       linki = malloc(titles * sizeof(size_t*));
+       linkis = malloc(titles * sizeof(size_t));
+
+       for (i = 0; i < titles; i++) {
+               size_t j;
+
+               for (j = 0; j < linkos[i]; j++) {
+                       size_t x = linko[i][j];
+
+                       linkis[x]++;
+                       linki[x] = realloc(linki[x], linkis[x] * sizeof(linki[x][0]));
+
+                       linki[x][linkis[x] - 1] = i;
+               }
+       }
+
+       printf("Links turned upside down.\n");
+
+
+
+       out_file = fopen("links-incoming.bin", "wb");
+       fwrite(&titles, sizeof(titles), 1, out_file);
+       for (i = 0; i < titles; i++) {
+               size_t j;
+
+               fwrite(&linkis[i], sizeof(linkis[i]), 1, out_file);
+
+               for (j = 0; j < linkis[i]; j++) {
+                       fwrite(&linki[i][j], sizeof(linki[i][j]), 1, out_file);
+               }
+       }
+       fclose(out_file);
+
+       printf("Incoming links written.\n");
+}