3 * (c) Copyright 1988-1998 by the Massachusetts Institute of Technology.
4 * For copying and distribution information, please see the file
8 #include <mit-copyright.h>
15 EXEC SQL INCLUDE sqlca;
19 EXEC SQL WHENEVER SQLERROR DO dbmserr();
/* Forward declarations for the reporting and repair helpers defined later
 * in this file. */
20 int show_user_id(void *user);
21 void handle_duplicate_logins(struct save_queue *sq);
22 void fix_user_id(void *user);
23 void cant_fix(void *id);
24 int show_mach_id(void *machine);
25 int show_mach_name(void *machine);
26 void fix_mach_id(void *machine);
27 int show_snet_name(void *subnet);
28 int show_clu_id(void *cluster);
29 int show_clu_name(void *cluster);
30 void fix_clu_id(void *cluster);
31 int show_list_id(void *list);
32 int show_list_name(void *list);
33 void fix_list_id(void *list);
34 int show_fs_id(void *filesys);
35 void fix_fs_id(void *filesys);
36 int show_fs_name(void *fs);
37 int show_np_id(void *nfsphys);
38 void fix_np_id(void *nfsphys);
39 int show_str_id(void *string);
40 int print_str_id(void *id);
41 void print_dup_map(int key, void *data, void *hint);
/* Report that a user record has a duplicate ID.
 * user is read as a struct user; its login, fullname and status are printed.
 */
43 int show_user_id(void *user)
45 struct user *u = user;
46 printf("User %s (%s, status %d) has duplicate ID\n",
47 u->login, u->fullname, u->status);
/* Walk a save queue of user records and report pairs that share a login.
 * For each matching pair the operator is offered a delete (only when the
 * full names match as well) or an unregister of the second record.
 */
51 void handle_duplicate_logins(struct save_queue *sq)
53 struct user *u, *uu, *tmp;
/* The first queued record becomes the reference entry uu. */
56 if (sq_get_data(sq, &uu))
/* Every further queued record u is compared against uu. */
58 while (sq_get_data(sq, &u))
60 if (!strcmp(u->login, uu->login))
/* NOTE(review): the body of the next test is not visible in this excerpt;
 * presumably it swaps u and uu through tmp so that uu is the record to be
 * removed -- confirm against the full file. */
62 if (uu->status == 1 || u->status == 0)
68 printf("User %s (%s, status %d) and\n",
69 u->login, u->fullname, u->status);
70 printf("User %s (%s, status %d) have duplicate logins\n",
71 uu->login, uu->fullname, uu->status);
/* Deletion is only offered when the two full names are identical. */
72 if (!strcmp(u->fullname, uu->fullname) &&
73 single_fix("Delete the second one", 0))
74 single_delete("users", "users_id", uu->users_id);
75 else if (single_fix("Unregister the second one", 0))
/* Host variables for the unregister statement: id is the users_id of uu.
 * The visible SET clause rewrites login to a hash sign followed by the
 * unix_uid and sets status to 0. */
77 EXEC SQL BEGIN DECLARE SECTION;
78 int id = uu->users_id, rowcount;
79 EXEC SQL END DECLARE SECTION;
82 SET login = '#' || CHAR(users.unix_uid), status = 0
/* sqlerrd[2] is used as the number of rows the statement processed. */
84 rowcount = sqlca.sqlerrd[2];
87 printf("%d entr%s fixed\n", rowcount,
88 rowcount == 1 ? "y" : "ies");
91 printf("Not fixed\n");
/* Repair a duplicate user ID: whatever generic_fix_id returns for the users
 * table (looked up by login) is stored back into the in-memory record.
 */
101 void fix_user_id(void *user)
103 struct user *u = user;
104 u->users_id = generic_fix_id("users", "users_id", "login",
105 u->users_id, u->login);
/* Placeholder repair routine for problems with no automatic fix: it only
 * prints a message. The id argument is not used in the visible lines.
 */
109 void cant_fix(void *id)
111 printf("Sorry, don't know how to fix that\n");
/* Report a machine record whose ID is duplicated; prints name and mach_id. */
114 int show_mach_id(void *machine)
116 struct machine *m = machine;
117 printf("Machine %s has duplicate ID %d\n", m->name, m->mach_id);
/* Report a machine record whose name is duplicated; prints name and mach_id. */
121 int show_mach_name(void *machine)
123 struct machine *m = machine;
124 printf("Machine %s (%d) has duplicate name\n", m->name, m->mach_id);
/* Repair a duplicate machine ID: the value returned by generic_fix_id for
 * the machine table (looked up by name) replaces the record mach_id.
 */
128 void fix_mach_id(void *machine)
130 struct machine *m = machine;
131 m->mach_id = generic_fix_id("machine", "mach_id", "name",
132 m->mach_id, m->name);
/* Report a subnet record whose name is duplicated; prints name and snet_id. */
135 int show_snet_name(void *subnet)
137 struct subnet *s = subnet;
138 printf("Subnet %s (%d) has duplicate name\n", s->name, s->snet_id);
/* Report a cluster record whose ID is duplicated; prints name and clu_id. */
142 int show_clu_id(void *cluster)
144 struct cluster *c = cluster;
145 printf("Cluster %s has duplicate ID %d\n", c->name, c->clu_id);
/* Report a cluster record whose name is duplicated; prints name and clu_id. */
149 int show_clu_name(void *cluster)
151 struct cluster *c = cluster;
152 printf("Cluster %s (%d) has duplicate name\n", c->name, c->clu_id);
/* Repair a duplicate cluster ID: the value returned by generic_fix_id for
 * the cluster table (looked up by name) replaces the record clu_id.
 */
156 void fix_clu_id(void *cluster)
158 struct cluster *c = cluster;
159 c->clu_id = generic_fix_id("cluster", "clu_id", "name", c->clu_id, c->name);
/* Report a list record whose ID is duplicated; prints name and list_id. */
162 int show_list_id(void *list)
164 struct list *l = list;
165 printf("List %s has duplicate ID %d\n", l->name, l->list_id);
/* Report a list record whose name is duplicated; prints name and list_id. */
169 int show_list_name(void *list)
171 struct list *l = list;
172 printf("List %s (%d) has duplicate name\n", l->name, l->list_id);
/* Repair a duplicate list ID: the value returned by generic_fix_id for the
 * list table (looked up by name) replaces the record list_id.
 */
176 void fix_list_id(void *list)
178 struct list *l = list;
179 l->list_id = generic_fix_id("list", "list_id", "name", l->list_id, l->name);
/* Report a filesys record whose ID is duplicated; prints name and filsys_id. */
182 int show_fs_id(void *filesys)
184 struct filesys *f = filesys;
185 printf("Filesys %s has duplicate ID %d\n", f->name, f->filsys_id);
189 void fix_fs_id(void *filesys)
191 struct filesys *f = filesys;
192 f->filsys_id = generic_fix_id("filesys", "filsys_id", "label",
193 f->filsys_id, f->name);
/* Report a filesys record whose name is duplicated; prints name and
 * filsys_id. */
196 int show_fs_name(void *filesys)
198 struct filesys *fs = filesys;
199 printf("Filesys %s (%d) has duplicate name\n", fs->name, fs->filsys_id);
/* Report an nfsphys record whose ID is duplicated. The owning machine is
 * looked up in the machines hash by mach_id and printed as machine:dir.
 * NOTE(review): the hash_lookup result is dereferenced without a check, so
 * a record whose mach_id is absent from the machines hash looks unsafe
 * here -- confirm whether hash_lookup can return NULL.
 */
203 int show_np_id(void *nfsphys)
205 struct nfsphys *n = nfsphys;
206 printf("NfsPhys %s:%s has duplicate ID %d\n",
207 ((struct machine *)hash_lookup(machines, n->mach_id))->name,
208 n->dir, n->nfsphys_id);
/* Repair a duplicate nfsphys ID: the value returned by generic_fix_id for
 * the nfsphys table (looked up by dir) replaces the record nfsphys_id.
 */
212 void fix_np_id(void *nfsphys)
214 struct nfsphys *n = nfsphys;
215 n->nfsphys_id = generic_fix_id("nfsphys", "nfsphys_id", "dir",
216 n->nfsphys_id, n->dir);
/* Report a string record whose ID is duplicated; prints name and string_id. */
219 int show_str_id(void *string)
221 struct string *s = string;
222 printf("String %s has duplicate ID %d\n", s->name, s->string_id);
/* Report a duplicate string by number. The pointer argument is not
 * dereferenced; it is cast directly to int and printed as the string ID.
 */
226 int print_str_id(void *id)
228 printf("String %d is a duplicate\n", (int)id);
/* Print one entry of a duplicate-string mapping: key is reported as a
 * duplicate of the integer carried in data (data is cast to int, not
 * dereferenced). hint is not used in the visible lines. This routine is
 * handed to hash_step for the string_dups hash.
 */
232 void print_dup_map(int key, void *data, void *hint)
234 printf("String %d is a duplicate of string %d\n", key, (int)data);
/* Start of the phase 1 routine body; the line carrying the function header
 * is not part of this excerpt. The first step finds rows of the strings
 * table that carry identical text and records them in string_dups.
 */
239 EXEC SQL BEGIN DECLARE SECTION;
241 EXEC SQL END DECLARE SECTION;
242 int i, q, retval, tmp;
243 struct save_queue *sq;
253 printf("Phase 1 - Looking for duplicates\n");
255 /* self-join strings table on "string" to get duplicate strings, then
256 build a duplicates table to merge them. */
258 dprintf("Looking for duplicate strings...\n");
259 string_dups = create_hash(100);
261 out_of_mem("storing duplicate strings");
263 EXEC SQL DECLARE csr116 CURSOR FOR
264 SELECT s1.string_id, s2.string_id FROM strings s1, strings s2
265 WHERE s1.string = s2.string and s1.string_id < s2.string_id;
266 EXEC SQL OPEN csr116;
267 /* The SELECT gives us two columns, both with non-negative integers.
268 * The number in the left column is always the smaller of the two,
269 * and each row includes string IDs for identical strings. We use
270 * them to make a mapping from id-to-delete to id-to-keep for all
276 EXEC SQL BEGIN DECLARE SECTION;
278 EXEC SQL END DECLARE SECTION;
280 EXEC SQL FETCH csr116 INTO :id1, :id2;
284 /* If id2 is already stored, skip this row. */
285 i = (int)hash_lookup(string_dups, id2);
288 /* Follow the chain of id1 equivalent IDs back to the lowest one. */
290 while ((tmp = (int)hash_lookup(string_dups, id)) > 0)
292 hash_store(string_dups, id2, (void *)id);
294 EXEC SQL CLOSE csr116;
295 dprintf("found %d duplicates\n", q);
/* Every stored mapping is printed through print_dup_map. */
296 hash_step(string_dups, print_dup_map, NULL);
297 /* We don't want to delete the duplicates now because if the dbck
298 is cancelled, a LOT of state will be lost. So, we'll just let
299 them not get marked as used and then phase3 will clean them up */
/* Load every row of the strings table into the strings hash, keyed by
 * string_id. Each entry is a freshly allocated struct string. */
301 dprintf("Loading strings...\n");
303 strings = create_hash(75000);
305 out_of_mem("loading strings");
307 EXEC SQL DECLARE csr101 CURSOR FOR
308 SELECT string_id, string FROM strings ORDER BY string_id;
309 EXEC SQL OPEN csr101;
313 EXEC SQL BEGIN DECLARE SECTION;
315 char buf[STRINGS_STRING_SIZE];
316 EXEC SQL END DECLARE SECTION;
318 EXEC SQL FETCH csr101 INTO :id, :buf;
322 s = malloc(sizeof(struct string));
324 out_of_mem("storing strings");
/* The record keeps its own heap copy of the trimmed text. */
325 s->name = strdup(strtrim(buf));
328 retval = hash_store(strings, id, s);
330 out_of_mem("storing strings in hash table");
/* A hash_store result of 1 is treated as an ID that was already present;
 * the entry found under that ID is queued on sq. */
331 else if (retval == 1) /* duplicate string_id */
333 sq_save_data(sq, hash_lookup(strings, id));
337 EXEC SQL CLOSE csr101;
338 /* keep string id 0 (the empty string) even if unreferenced */
341 printf("Loaded %d strings\n", q);
/* Load the users table into the users hash (keyed by users_id), hand
 * duplicate IDs to generic_fix, then collect and process duplicate logins.
 */
343 dprintf("Loading users...\n");
345 users = create_hash(30000);
347 out_of_mem("loading users");
349 EXEC SQL DECLARE csr102 CURSOR FOR
350 SELECT users_id, login, last, first, status, potype, pop_id, box_id,
351 modby, fmodby, pmodby, comments, sigwho FROM users
353 EXEC SQL OPEN csr102;
356 EXEC SQL BEGIN DECLARE SECTION;
357 char login[USERS_LOGIN_SIZE], nbuf[USERS_FIRST_SIZE + USERS_LAST_SIZE];
358 char last[USERS_LAST_SIZE], first[USERS_FIRST_SIZE];
359 char potype[USERS_POTYPE_SIZE];
360 int users_id, status, pop_id, box_id, modby, fmodby, pmodby;
361 int comments, sigwho;
362 EXEC SQL END DECLARE SECTION;
364 EXEC SQL FETCH csr102 INTO :users_id, :login, :last, :first,
365 :status, :potype, :pop_id, :box_id, :modby, :fmodby, :pmodby,
370 u = malloc(sizeof(struct user));
372 out_of_mem("storing users");
373 strcpy(u->login, strtrim(login));
/* Only the first character of the fetched potype is kept. */
374 u->potype = potype[0];
/* nbuf holds USERS_FIRST_SIZE + USERS_LAST_SIZE bytes, but the comma, the
 * space and the terminator add three bytes to the two names, so two names
 * that each fill their buffer would overrun it by one byte with an
 * unbounded sprintf. Bound the write to the buffer size instead. */
375 snprintf(nbuf, sizeof(nbuf), "%s, %s", strtrim(last), strtrim(first));
376 u->fullname = strdup(nbuf);
378 u->users_id = users_id;
382 u->comment = comments;
/* pobox_id is assigned from either pop_id or box_id; the statements that
 * select between the two are not visible in this excerpt. */
387 u->pobox_id = pop_id;
390 /* If potype is SMTP, box_id is a string_id for the strings tbl */
391 u->pobox_id = box_id;
396 retval = hash_store(users, users_id, u);
398 out_of_mem("storing users in hash table");
/* A hash_store result of 1 is treated as a users_id that was already
 * present; the entry found under that ID is queued on sq. */
399 else if (retval == 1)
401 sq_save_data(sq, hash_lookup(users, users_id));
405 EXEC SQL CLOSE csr102;
407 generic_fix(sq, show_user_id, "Change ID", fix_user_id, 0);
413 out_of_mem("finding duplicate logins");
/* Self-join on login: rows with equal login but different rowid. */
415 EXEC SQL DECLARE csr103 CURSOR FOR
416 SELECT u1.users_id FROM users u1, users u2
417 WHERE u1.login = u2.login and u1.rowid != u2.rowid;
418 EXEC SQL OPEN csr103;
421 EXEC SQL FETCH csr103 INTO :id;
424 sq_save_data(sq, hash_lookup(users, id));
426 EXEC SQL CLOSE csr103;
427 handle_duplicate_logins(sq);
/* Look for krbmap rows that repeat a users_id or a string_id. Both cases
 * are only reported; the messages state that no repair is attempted. */
432 dprintf("Scanning krbmap...\n");
/* First pass: the same users_id on two different rows. */
434 EXEC SQL DECLARE csr113 CURSOR FOR
435 SELECT k1.users_id FROM krbmap k1, krbmap k2
436 WHERE k1.users_id = k2.users_id AND k1.rowid != k2.rowid;
437 EXEC SQL OPEN csr113;
440 EXEC SQL FETCH csr113 INTO :id;
444 printf("User %d is in the krbmap more than once!\n", id);
445 printf("Not fixing this error\n");
447 EXEC SQL CLOSE csr113;
/* Second pass: the same string_id on two different rows. */
449 EXEC SQL DECLARE csr114 CURSOR FOR
450 SELECT k1.string_id FROM krbmap k1, krbmap k2
451 WHERE k1.string_id = k2.string_id AND k1.rowid != k2.rowid;
452 EXEC SQL OPEN csr114;
455 EXEC SQL FETCH csr114 INTO :id;
459 printf("Principal %d is in the krbmap more than once!\n", id);
460 printf("Not fixing this error\n");
462 EXEC SQL CLOSE csr114;
/* Load the machine table into the machines hash (keyed by mach_id), hand
 * duplicate IDs to generic_fix, then report duplicate machine names and
 * hostalias conflicts. */
465 dprintf("Loading machines...\n");
467 machines = create_hash(20000);
468 if (!sq || !machines)
469 out_of_mem("loading machines");
471 EXEC SQL DECLARE csr104 CURSOR FOR
472 SELECT mach_id, name, snet_id, owner_type, owner_id,
473 acomment, ocomment, creator, modby
474 FROM machine ORDER BY mach_id;
475 EXEC SQL OPEN csr104;
478 EXEC SQL BEGIN DECLARE SECTION;
479 int mach_id, snet_id, owner_id, acomment, ocomment, creator, modby;
480 char name[MACHINE_NAME_SIZE], owner_type[MACHINE_OWNER_TYPE_SIZE];
481 EXEC SQL END DECLARE SECTION;
483 EXEC SQL FETCH csr104 INTO :mach_id, :name, :snet_id,
484 :owner_type, :owner_id, :acomment, :ocomment, :creator, :modby;
488 m = malloc(sizeof(struct machine));
490 out_of_mem("storing machines");
491 strcpy(m->name, strtrim(name));
/* Only the first character of the fetched owner_type is kept. */
492 m->owner_type = owner_type[0];
493 m->owner_id = owner_id;
494 m->snet_id = snet_id;
495 m->mach_id = mach_id;
497 m->acomment = acomment;
498 m->ocomment = ocomment;
499 m->creator = creator;
501 retval = hash_store(machines, mach_id, m);
503 out_of_mem("storing machines in hash table");
/* A hash_store result of 1 is treated as a mach_id that was already
 * present; the entry found under that ID is queued on sq. */
504 else if (retval == 1)
506 sq_save_data(sq, hash_lookup(machines, mach_id));
510 EXEC SQL CLOSE csr104;
511 generic_fix(sq, show_mach_id, "Change ID", fix_mach_id, 0);
515 EXEC SQL BEGIN DECLARE SECTION;
516 char name[HOSTALIAS_NAME_SIZE];
518 EXEC SQL END DECLARE SECTION;
522 out_of_mem("looking for duplicate machine names");
/* Self-join on name: machine rows with equal name but different rowid.
 * They are reported through show_mach_name with cant_fix as the repair. */
524 EXEC SQL DECLARE csr105 CURSOR FOR
525 SELECT m1.mach_id FROM machine m1, machine m2
526 WHERE m1.name = m2.name AND m1.rowid != m2.rowid;
527 EXEC SQL OPEN csr105;
530 EXEC SQL FETCH csr105 INTO :id;
534 sq_save_data(sq, hash_lookup(machines, id));
536 EXEC SQL CLOSE csr105;
537 generic_fix(sq, show_mach_name, "Change name", cant_fix, 0);
/* Aliases with the same name that belong to two different machines. */
539 EXEC SQL DECLARE csr_hal1 CURSOR FOR
540 SELECT h1.name, m1.mach_id, m2.mach_id
541 FROM hostalias h1, machine m1, hostalias h2, machine m2
542 WHERE h1.name = h2.name AND h1.mach_id != h2.mach_id
543 AND m1.mach_id = h1.mach_id AND m2.mach_id = h2.mach_id;
544 EXEC SQL OPEN csr_hal1;
547 EXEC SQL FETCH csr_hal1 INTO :name, :id1, :id2;
550 printf("Aliases for machines %d and %d have duplicate name %s\n",
551 id1, id2, strtrim(name));
554 EXEC SQL CLOSE csr_hal1;
/* Aliases whose name equals the name of a machine row: id1 is the machine
 * carrying that name, id2 is the machine that owns the alias. */
556 EXEC SQL DECLARE csr_hal2 CURSOR FOR
557 SELECT h1.name, m1.mach_id, m2.mach_id
558 FROM hostalias h1, machine m1, machine m2
559 WHERE h1.name = m1.name AND h1.mach_id = m2.mach_id;
560 EXEC SQL OPEN csr_hal2;
563 EXEC SQL FETCH csr_hal2 INTO :name, :id1, :id2;
566 printf("Machine %d has alias %s that conflicts with machine %d\n",
567 id2, strtrim(name), id1);
570 EXEC SQL CLOSE csr_hal2;
/* Load the subnet table into the subnets hash (keyed by snet_id), report
 * duplicate IDs, then report duplicate subnet names. */
573 dprintf("Loading subnets...\n");
574 subnets = create_hash(254);
576 out_of_mem("loading subnets");
578 EXEC SQL DECLARE csr115 CURSOR FOR
579 SELECT snet_id, name, owner_type, owner_id, modby from subnet;
580 EXEC SQL OPEN csr115;
583 EXEC SQL BEGIN DECLARE SECTION;
584 char name[SUBNET_NAME_SIZE], owner_type[SUBNET_OWNER_TYPE_SIZE];
585 int snet_id, owner_id, modby;
586 EXEC SQL END DECLARE SECTION;
588 EXEC SQL FETCH csr115 INTO :snet_id, :name, :owner_type,
/* Size the allocation from the pointer itself; the earlier code sized a
 * subnet record with sizeof(struct machine), which is the wrong type. */
593 sn = malloc(sizeof(*sn));
595 out_of_mem("storing subnets");
596 strcpy(sn->name, strtrim(name));
/* Only the first character of the fetched owner_type is kept. */
597 sn->owner_type = owner_type[0];
598 sn->owner_id = owner_id;
599 sn->snet_id = snet_id;
601 retval = hash_store(subnets, snet_id, sn);
603 out_of_mem("storing subnets in hash table");
604 else if (retval == 1)
/* Report the ID that was just fetched. The shared id variable is not
 * assigned by this cursor, so printing it showed a stale value. */
606 printf("Duplicate subnet ID: %d (%s)\n", snet_id, name);
607 /* should add code to delete */
611 EXEC SQL CLOSE csr115;
617 out_of_mem("looking for duplicate subnet names");
/* Self-join on name: subnet rows with equal name but different rowid.
 * They are reported through show_snet_name with cant_fix as the repair. */
619 EXEC SQL DECLARE csr117 CURSOR FOR
620 SELECT s1.snet_id FROM subnet s1, subnet s2
621 WHERE s1.name = s2.name AND s1.rowid != s2.rowid;
622 EXEC SQL OPEN csr117;
625 EXEC SQL FETCH csr117 INTO :id;
629 sq_save_data(sq, hash_lookup(subnets, id));
631 EXEC SQL CLOSE csr117;
632 generic_fix(sq, show_snet_name, "Change name", cant_fix, 0);
/* Load the clusters table into the clusters hash (keyed by clu_id), hand
 * duplicate IDs to generic_fix, then report duplicate cluster names. */
635 dprintf("Loading clusters...\n");
637 clusters = create_hash(100);
638 if (!sq || !clusters)
639 out_of_mem("loading clusters");
641 EXEC SQL DECLARE csr106 CURSOR FOR
642 SELECT clu_id, name, modby FROM clusters;
643 EXEC SQL OPEN csr106;
646 EXEC SQL BEGIN DECLARE SECTION;
648 char name[CLUSTERS_NAME_SIZE];
649 EXEC SQL END DECLARE SECTION;
651 EXEC SQL FETCH csr106 INTO :clu_id, :name, :modby;
655 c = malloc(sizeof(struct cluster));
657 out_of_mem("storing clusters");
658 strcpy(c->name, strtrim(name));
661 retval = hash_store(clusters, clu_id, c);
663 out_of_mem("storing clusters in hash table");
/* A hash_store result of 1 is treated as a clu_id that was already
 * present; the entry found under that ID is queued on sq. */
664 else if (retval == 1)
666 sq_save_data(sq, hash_lookup(clusters, clu_id));
670 EXEC SQL CLOSE csr106;
671 generic_fix(sq, show_clu_id, "Change ID", fix_clu_id, 0);
677 out_of_mem("looking for duplicate cluster names");
/* Self-join on name: cluster rows with equal name but different rowid.
 * They are reported through show_clu_name with cant_fix as the repair. */
679 EXEC SQL DECLARE csr107 CURSOR FOR
680 SELECT c1.clu_id FROM clusters c1, clusters c2
681 WHERE c1.name = c2.name AND c1.rowid != c2.rowid;
682 EXEC SQL OPEN csr107;
685 EXEC SQL FETCH csr107 INTO :id;
689 sq_save_data(sq, hash_lookup(clusters, id));
691 EXEC SQL CLOSE csr107;
692 generic_fix(sq, show_clu_name, "Change name", cant_fix, 0);
/* Load the list table into the lists hash (keyed by list_id), hand
 * duplicate IDs to generic_fix, then report duplicate list names. */
695 dprintf("Loading lists...\n");
697 lists = create_hash(50000);
699 out_of_mem("loading lists");
701 EXEC SQL DECLARE csr108 CURSOR FOR
702 SELECT list_id, name, acl_id, acl_type, modby FROM list
704 EXEC SQL OPEN csr108;
707 EXEC SQL BEGIN DECLARE SECTION;
708 int list_id, acl_id, modby;
709 char name[LIST_NAME_SIZE], acl_type[LIST_ACL_TYPE_SIZE];
710 EXEC SQL END DECLARE SECTION;
712 EXEC SQL FETCH csr108 INTO :list_id, :name, :acl_id, :acl_type, :modby;
715 l = malloc(sizeof(struct list));
717 out_of_mem("storing lists");
718 strcpy(l->name, strtrim(name));
/* Only the first character of the fetched acl_type is kept. */
719 l->acl_type = acl_type[0];
721 l->list_id = list_id;
724 retval = hash_store(lists, list_id, l);
726 out_of_mem("storing lists in hash table");
/* A hash_store result of 1 is treated as a list_id that was already
 * present; the entry found under that ID is queued on sq. */
727 else if (retval == 1)
729 sq_save_data(sq, hash_lookup(lists, list_id));
733 EXEC SQL CLOSE csr108;
734 generic_fix(sq, show_list_id, "Change ID", fix_list_id, 0);
740 out_of_mem("looking for duplicate list names");
/* Self-join on name: list rows with equal name but different rowid.
 * They are reported through show_list_name with cant_fix as the repair. */
742 EXEC SQL DECLARE csr109 CURSOR FOR
743 SELECT l1.list_id FROM list l1, list l2
744 WHERE l1.name = l2.name AND l1.rowid != l2.rowid;
745 EXEC SQL OPEN csr109;
748 EXEC SQL FETCH csr109 INTO :id;
752 sq_save_data(sq, hash_lookup(lists, id));
754 EXEC SQL CLOSE csr109;
755 generic_fix(sq, show_list_name, "Change name", cant_fix, 0);
/* Load the filesys table into the filesys hash (keyed by filsys_id), hand
 * duplicate IDs to generic_fix, then report duplicate labels. */
758 dprintf("Loading filesys...\n");
760 filesys = create_hash(30000);
762 out_of_mem("loading filesys");
764 EXEC SQL DECLARE csr110 CURSOR FOR
765 SELECT filsys_id, label, owner, owners, phys_id, mach_id,
766 type, name, modby FROM filesys ORDER BY filsys_id;
767 EXEC SQL OPEN csr110;
770 EXEC SQL BEGIN DECLARE SECTION;
771 int filsys_id, owner, owners, phys_id, mach_id, modby;
772 char label[FILESYS_LABEL_SIZE], type[FILESYS_TYPE_SIZE];
773 char name[FILESYS_NAME_SIZE];
774 EXEC SQL END DECLARE SECTION;
776 EXEC SQL FETCH csr110 INTO :filsys_id, :label, :owner, :owners,
777 :phys_id, :mach_id, :type, :name, :modby;
781 f = malloc(sizeof(struct filesys));
783 out_of_mem("storing filesystems");
/* Note the mapping: the label column fills the name field and the name
 * column fills the dir field of the in-memory record. */
784 strcpy(f->name, strtrim(label));
785 strcpy(f->dir, strtrim(name));
786 f->filsys_id = filsys_id;
789 f->phys_id = phys_id;
790 f->mach_id = mach_id;
792 retval = hash_store(filesys, filsys_id, f);
794 out_of_mem("storing filesys in hash table");
/* A hash_store result of 1 is treated as a filsys_id that was already
 * present; the entry found under that ID is queued on sq. */
795 else if (retval == 1)
797 sq_save_data(sq, hash_lookup(filesys, filsys_id));
801 EXEC SQL CLOSE csr110;
803 generic_fix(sq, show_fs_id, "Change ID", fix_fs_id, 0);
809 out_of_mem("looking for duplicate filesys names");
/* Self-join on label: filesys rows with equal label but different rowid.
 * They are reported through show_fs_name with cant_fix as the repair. */
811 EXEC SQL DECLARE csr118 CURSOR FOR
812 SELECT fs1.filsys_id FROM filesys fs1, filesys fs2
813 WHERE fs1.label = fs2.label AND fs1.rowid != fs2.rowid;
814 EXEC SQL OPEN csr118;
817 EXEC SQL FETCH csr118 INTO :id;
821 sq_save_data(sq, hash_lookup(filesys, id));
823 EXEC SQL CLOSE csr118;
824 generic_fix(sq, show_fs_name, "Change name", cant_fix, 0);
/* Load the nfsphys table into the nfsphys hash (keyed by nfsphys_id) and
 * hand duplicate IDs to generic_fix. */
827 dprintf("Loading nfsphys...\n");
829 nfsphys = create_hash(500);
/* NOTE(review): the message below spells the table name as nfsphs while
 * every other message in this section uses nfsphys -- likely a typo. */
831 out_of_mem("loading nfsphs");
833 EXEC SQL DECLARE csr111 CURSOR FOR
834 SELECT nfsphys_id, dir, mach_id, allocated, modby FROM nfsphys;
835 EXEC SQL OPEN csr111;
838 EXEC SQL BEGIN DECLARE SECTION;
839 int nfsphys_id, mach_id, allocated, modby;
840 char dir[NFSPHYS_DIR_SIZE];
841 EXEC SQL END DECLARE SECTION;
843 EXEC SQL FETCH csr111 INTO :nfsphys_id, :dir, :mach_id,
848 n = malloc(sizeof(struct nfsphys));
850 out_of_mem("storing nfsphys");
851 strcpy(n->dir, strtrim(dir));
852 n->mach_id = mach_id;
853 n->nfsphys_id = nfsphys_id;
854 n->allocated = allocated;
857 retval = hash_store(nfsphys, nfsphys_id, n);
859 out_of_mem("storing nfsphys in hash table");
/* A hash_store result of 1 is treated as an nfsphys_id that was already
 * present; the entry found under that ID is queued on sq. */
860 else if (retval == 1)
862 sq_save_data(sq, hash_lookup(nfsphys, nfsphys_id));
866 EXEC SQL CLOSE csr111;
868 generic_fix(sq, show_np_id, "Change ID", fix_np_id, 0);
/* Report printcap rows that share a name. The join uses rowid less-than
 * rather than not-equal, so each pair of rows is selected once. Nothing is
 * repaired in the visible lines; the name is printed as fetched, without
 * the strtrim call used elsewhere in this routine. */
870 dprintf("Checking printcap...\n");
872 EXEC SQL DECLARE csr119 CURSOR FOR
873 SELECT p1.name FROM printcap p1, printcap p2
874 WHERE p1.name = p2.name AND p1.rowid < p2.rowid;
875 EXEC SQL OPEN csr119;
878 EXEC SQL BEGIN DECLARE SECTION;
879 char name[PRINTCAP_NAME_SIZE];
880 EXEC SQL END DECLARE SECTION;
882 EXEC SQL FETCH csr119 INTO :name;
886 printf("Printer %s has duplicate name\n", name);
889 EXEC SQL CLOSE csr119;