X-Git-Url: https://git.llucax.com/z.facultad/75.06/emufs.git/blobdiff_plain/4da22b509af90f905ad13be0b846e41a8d89e3c2..289dcaa6f45429b0c68e1490743b9d73d698678e:/emufs/indice_b.c?ds=sidebyside

diff --git a/emufs/indice_b.c b/emufs/indice_b.c
index 183c6fe..9a5118d 100644
--- a/emufs/indice_b.c
+++ b/emufs/indice_b.c
@@ -1,6 +1,7 @@
 
 #include "indice_b.h"
 #include "common.h"
+#include "emufs.h"
 
 /* Cantidad de claves por nodo */
 #define CANT_HIJOS(x) ((x->tam_bloque-sizeof(B_NodoHeader))/sizeof(B_NodoEntry))
@@ -52,6 +53,11 @@ static void b_pasar_clave_a_derecha(INDICE*, char*, int, char*, int, int, B_Nodo
 static void b_pasar_clave_a_izquierda(INDICE*, char*, int, char*, int, int, B_NodoEntry);
 /** Junta 2 nodos y hace uno solo */
 static void b_fundir_nodo(char *, int, char *, int, char *, int, int);
+			
+static EMUFS_REG_ID b_insertar_dup_en_pos(INDICE *idx, INDICE_DATO pos, INDICE_DATO nuevo);
+
+static void abreviar_claves(INDICE *idx, B_NodoEntry *array, B_NodoHeader *header);
+static void desabreviar_claves(INDICE *idx, B_NodoEntry *array, B_NodoHeader *header);
 
 void emufs_indice_b_crear(INDICE *idx)
 {
@@ -65,8 +71,6 @@ void emufs_indice_b_crear(INDICE *idx)
 	header.hijo_izquierdo = -1;
 
 	fp = fopen(idx->filename, "w");
-	PERR("Creando indice");
-	fprintf(stderr, "Archivo = (%s)\n", idx->filename);
 	if (fp == NULL) {
 		PERR("Error al crear el archivo");
 		return;
@@ -88,6 +92,7 @@ int emufs_indice_b_insertar(INDICE *idx, CLAVE clave, INDICE_DATO dato)
 	B_NodoHeader header;
 	B_NodoEntry *claves;
 	char *nodo, *padre;
+	INDICE_DATO dummy;
 	
 	/* Leo la raiz */
 	nodo = b_leer_nodo(idx, 0);
@@ -102,13 +107,19 @@ int emufs_indice_b_insertar(INDICE *idx, CLAVE clave, INDICE_DATO dato)
 		i=0;
 		while ((i<header.cant) && (emufs_indice_es_menor(idx, claves[i].clave, clave))) i++;
 		if ((i<header.cant) && (emufs_indice_es_igual(idx, claves[i].clave, clave))) {
-			if (idx->tipo == IND_PRIMARIO) {
+			if (idx->funcion == IND_PRIMARIO) {
 				PERR("Indice primario no puede contener claves duplicadas!");
+				PERR(idx->nombre);
 				return 0;
 			}
 			
 			/* TODO : Implementar carga de valor en clave duplicada! */
-			
+			b_insertar_dup_en_pos(idx, claves[i].dato, dato);
+		
+			if (idx->tipo_dato == IDX_STRING) {
+				/* Tengo que sacar el texto repetido del archivo de textos */
+				idx->emu_string->borrar_registro(idx->emu_string, clave);
+			}
 			return 1;
 		} else {
 			if (i == 0) {
@@ -124,6 +135,15 @@ int emufs_indice_b_insertar(INDICE *idx, CLAVE clave, INDICE_DATO dato)
 	if (nodo) free(nodo);
 	nodo = padre;
 	nodo_id = padre_id;
+
+	if (idx->funcion != IND_PRIMARIO) {
+		/* Agrego el DATO real al archivo de claves repetiras
+		 * y me guardo el ID para poner en el indice
+		 */
+		dummy.id = -1;
+		dato.id = b_insertar_dup_en_pos(idx, dummy, dato);
+	}
+
 	b_insertar_en_nodo(idx, clave, dato, nodo_id, nodo, -1, -1);
 	return 1; /* Agregar OK! */
 }
@@ -135,30 +155,30 @@ INDICE_DATO emufs_indice_b_buscar(INDICE *idx, CLAVE clave)
 	B_NodoHeader header;
 	B_NodoEntry *claves;
 	char *nodo, *tmp;
-	
-	if (idx->tipo != IND_PRIMARIO) {
-		/* SOLO SE PUEDE BUSCAR CON CLAVE UNICA! */
-		ret.id = ret.bloque = -1;
-		return ret;
-	}
+	int nodo_id;
 	
 	/* Leo la raiz */
 	nodo = b_leer_nodo(idx, 0);
+	nodo_id = 0;
 	while (nodo) {
 		b_leer_header(nodo, &header);
 		claves = b_leer_claves(nodo, &header);
 		i=0;
 		while ((i<header.cant) && (emufs_indice_es_menor(idx, claves[i].clave, clave))) i++;
-		if (emufs_indice_es_igual(idx, claves[i].clave, clave)) {
+		if ((i<header.cant) && (emufs_indice_es_igual(idx, claves[i].clave, clave))) {
 				ret = claves[i].dato;
+				b_grabar_nodo(idx, nodo_id, nodo);
 				free(nodo);
 				return ret;
 		} else {
 			tmp = nodo;
+			b_grabar_nodo(idx, nodo_id, nodo);
 			if (i == 0) {
 				nodo = b_leer_nodo(idx, header.hijo_izquierdo);
+				nodo_id = header.hijo_izquierdo;
 			} else {
 				nodo = b_leer_nodo(idx, claves[i-1].hijo_derecho);
+				nodo_id = claves[i-1].hijo_derecho;
 			}
 			free(tmp);
 		}
@@ -180,7 +200,6 @@ int emufs_indice_b_borrar(INDICE *idx, CLAVE k)
 
 	nodo_id = 0; /* Tomo la raiz */
 	nodo = b_leer_nodo(idx, nodo_id);
-	PERR("Buscando clave a borrar");
 	while (nodo && !encontrado) {
 		/* Obtengo los datos del nodo */
 		b_leer_header(nodo, &header);
@@ -250,6 +269,8 @@ static char *b_leer_nodo(INDICE *idx, int id)
 {
 	FILE *fp;
 	char *out;
+	B_NodoHeader header;
+	B_NodoEntry *claves;
 
 	if (id < 0) return NULL;
 
@@ -271,6 +292,12 @@ static char *b_leer_nodo(INDICE *idx, int id)
 		return NULL;
 	}
 
+	/* Si estoy manejando string tengo que sacar las abreviaturas */
+	if (idx->tipo_dato == IDX_STRING) {
+		b_leer_header(out, &header);
+		claves = b_leer_claves(out, &header);
+		desabreviar_claves(idx, claves, &header);
+	}
 	fclose(fp);
 	return out;
 }
@@ -278,24 +305,15 @@ static char *b_leer_nodo(INDICE *idx, int id)
 static void b_grabar_nodo(INDICE *idx, int id, char *data)
 {
 	FILE *fp;
+	B_NodoHeader header;
+	B_NodoEntry *claves;
 
-/*	if (id > b_ultimo_id()) {
-		printf("AGREGANDO AL FINAL\n");
-		fp = fopen(FILENAME, "a");
-		if (fp == NULL) {
-		_("No se pudo abrir archivo\n");
-			return;
-		}
-	} else {
-		fp = fopen(FILENAME, "w");
-		if (fp == NULL) {
-		_("No se pudo abrir archivo\n");
-			return;
-		}
-		fseek(fp, id*BLOCK_SIZE, SEEK_SET);
-		printf("SOLO GUARDO DATA\n");
-	}*/
-
+	/* Si las claves son de tipo string debo abreviar antes de guardar */
+	if (idx->tipo_dato == IDX_STRING) {
+		b_leer_header(data, &header);
+		claves = b_leer_claves(data, &header);
+		abreviar_claves(idx, claves, &header);
+	}
 	fp = fopen(idx->filename, "r+");
 	fseek(fp, id*idx->tam_bloque, SEEK_SET);
 	fwrite(data, 1, idx->tam_bloque, fp);
@@ -352,15 +370,25 @@ static void b_insertar_en_nodo(INDICE *idx, CLAVE clave, INDICE_DATO dato, int n
 			i=0;
 			/* Creo una lista ordenada de los nodos a partir */
 			tmp_claves = (B_NodoEntry *)malloc(sizeof(B_NodoEntry)*(nodo_header.cant+1));
-			total = nodo_header.cant;
+			total = nodo_header.cant+1;
 			while ((i<nodo_header.cant) && (emufs_indice_es_menor(idx, claves[i].clave, clave))) {
 				tmp_claves[i] = claves[i];
 				i++;
 			}
 			tmp_claves[i].clave = clave;
 			tmp_claves[i].dato = dato;
-			tmp_claves[i].hijo_derecho = hijo1;
-			tmp_claves[i+1].hijo_derecho = hijo2;
+			/*tmp_claves[i].hijo_derecho = hijo1;*/
+			if (i==0) {
+				nodo_header.hijo_izquierdo = hijo1;
+				tmp_claves[i].hijo_derecho = hijo2;
+			} else {
+				tmp_claves[i-1].hijo_derecho = hijo1;
+				tmp_claves[i].hijo_derecho = hijo2;
+			}
+/*			if (i == 0)
+				nodo_header.hijo_izquierdo = hijo2;
+			else
+				tmp_claves[i+1].hijo_derecho = hijo2;*/
 			while (i < nodo_header.cant) {
 				tmp_claves[i+1] = claves[i];
 				i++;
@@ -370,8 +398,8 @@ static void b_insertar_en_nodo(INDICE *idx, CLAVE clave, INDICE_DATO dato, int n
 			b_leer_header(nuevo, &nuevo_header);
 
 			nuevo_header.nivel = nodo_header.nivel;
-			nodo_header.cant = total/2;
-			nuevo_header.cant = total - nodo_header.cant;
+			nodo_header.cant = total/2-1;
+			nuevo_header.cant = (total-1) - nodo_header.cant;
 
 			memset(claves, '*', idx->tam_bloque-sizeof(B_NodoHeader));
 			for(j=0; j<nodo_header.cant; j++)
@@ -380,14 +408,14 @@ static void b_insertar_en_nodo(INDICE *idx, CLAVE clave, INDICE_DATO dato, int n
 			claves_nuevo = b_leer_claves(nuevo, &nuevo_header);
 			memset(claves_nuevo, '*', idx->tam_bloque-sizeof(B_NodoHeader));
 			for(j=0; j<nuevo_header.cant; j++)
-				claves_nuevo[j] = tmp_claves[j+total/2+1];
+				claves_nuevo[j] = tmp_claves[j+total/2];
 
 			b_actualizar_header(nodo, &nodo_header);
 			b_actualizar_header(nuevo, &nuevo_header);
 
 			if (nodo_id != 0) {
 				clave = tmp_claves[total/2].clave;
-				/* XXX dato.bloque = nuevo_id; */
+				dato = tmp_claves[total/2].dato;
 
 				b_grabar_nodo(idx, nodo_id, nodo);
 				b_grabar_nodo(idx, nuevo_id, nuevo);
@@ -410,7 +438,7 @@ static void b_insertar_en_nodo(INDICE *idx, CLAVE clave, INDICE_DATO dato, int n
 				nodo = tmp_nuevo;
 	
 				clave = tmp_claves[total/2].clave;
-				/* XXX dato.bloque = nuevo_id; */
+				dato = tmp_claves[total/2].dato;
 
 				b_grabar_nodo(idx, nuevo_id+1, nodo);
 				b_grabar_nodo(idx, nuevo_id, nuevo);
@@ -454,15 +482,21 @@ void b_insertar_en_nodo_con_lugar(INDICE *idx, CLAVE clave, INDICE_DATO dato, in
 	claves = b_leer_claves(nodo, &nodo_header);
 	if (nodo_header.cant > 0) {
 		int j;
-		while ((emufs_indice_es_menor(idx, claves[i].clave, clave)) && (i < nodo_header.cant)) i++;
+		while ((i < nodo_header.cant) && (emufs_indice_es_menor(idx, claves[i].clave, clave))) i++;
 		for(j=nodo_header.cant; j > i; j--)
 			claves[j] = claves[j-1];
 	}
 	nodo_header.cant++;
 	claves[i].clave = clave;
 	claves[i].dato = dato;
-	claves[i].hijo_derecho = hijo2;
-	nodo_header.hijo_izquierdo = b_elegir_izquierdo(idx, nodo_header.hijo_izquierdo, hijo1);
+	if (i==0) {
+		nodo_header.hijo_izquierdo = hijo1;
+		claves[i].hijo_derecho = hijo2;
+	} else {
+		claves[i-1].hijo_derecho = hijo1;
+		claves[i].hijo_derecho = hijo2;
+	}
+	/*b_elegir_izquierdo(idx, nodo_header.hijo_izquierdo, hijo1);*/
 
 	b_actualizar_header(nodo, &nodo_header);
 	b_grabar_nodo(idx, nodo_id, nodo);
@@ -523,14 +557,41 @@ static int b_elegir_izquierdo(INDICE *idx, int a, int b)
 
 INDICE_DATO *emufs_indice_b_buscar_muchos(INDICE *idx, CLAVE clave, int *cant)
 {
+	EMUFS_REG_SIZE tam;
+	int error=0;
+	char *leido;
+	CLAVE k;
+	INDICE_DATO dato, *ret;
+
 	/* Si el indice es primario no tiene sentido hacer nada */
 	if (idx->funcion == IND_PRIMARIO) {
 		*cant = 0;
+		PERR("INDICE PRIMARIO NO SOPORTA BUSQUEDA MULTIPLE");
 		return NULL;
 	}
 
-	/* TODO Implementar indices con repeticion */
-	return NULL;
+	/* Busco la clave en el arbol */
+	dato = emufs_indice_b_buscar(idx, clave);
+
+	if (dato.id == -1) {
+		PERR("CLAvE NO ENCONTRADA EN EL ARBOL!");
+	}
+
+	/* Leo el contenido actual */
+	k.i_clave = dato.id;
+	error = 0;
+	leido = (char *)idx->emu_mult->leer_registro(idx->emu_mult, k, &tam, &error);
+
+	/* Incremento en 1 la cantidad */
+	if (leido != NULL)
+		(*cant) = *((int *)leido);
+	else
+		(*cant) = 0;
+
+	ret = malloc(sizeof(INDICE_DATO)*(*cant));
+	memcpy(ret, leido+sizeof(int), (*cant)*sizeof(INDICE_DATO));
+	free(leido);
+	return ret;
 }
 
 static void b_borrar_clave(INDICE *idx, char *nodo, int nodo_id, CLAVE k)
@@ -757,3 +818,141 @@ static void b_fundir_nodo(char *izq, int izq_id, char *padre, int padre_id, char
 {
 }
 
+static EMUFS_REG_ID b_insertar_dup_en_pos(INDICE *idx, INDICE_DATO pos, INDICE_DATO nuevo)
+{
+	int cant;
+	EMUFS_REG_SIZE tam;
+	int error=0;
+	INDICE_DATO *array;
+	char *leido;
+	CLAVE k;
+
+	/* Leo el contenido actual */
+	k.i_clave = pos.id;
+	error = 0;
+	leido = (char *)idx->emu_mult->leer_registro(idx->emu_mult, k, &tam, &error);
+
+	/* Incremento en 1 la cantidad */
+	if (leido != NULL)
+		cant = *((int *)leido);
+	else
+		cant = 0;
+	cant++;
+
+	/* Obtengo un nuevo lugar para el dato nuevo */
+	/* Aca todo bien, si leido es NULL se compota como malloc */
+	leido = realloc(leido, cant*sizeof(INDICE_DATO)+sizeof(int));
+	array = (INDICE_DATO *)(leido+sizeof(int));
+
+	/* Pongo el dato nuevo */
+	array[cant-1] = nuevo;
+
+	/* Actualizo la cantidad */
+	(*((int *)leido)) = cant;
+
+	/* Salvo */
+	if (k.i_clave == -1) {
+		/* Creo uno nuevo */
+		error = 0;
+		k.i_clave = idx->emu_mult->grabar_registro(idx->emu_mult,
+			leido,
+			cant*sizeof(INDICE_DATO)+sizeof(int),
+			&error
+		);
+		if (k.i_clave == -1) PERR("ALGO NO GRABO BIEN!!");
+	} else {
+		/* Modifico el que ya existia! */
+		error = 0;
+		idx->emu_mult->modificar_registro(idx->emu_mult,
+			k.i_clave,
+			leido,
+			cant*sizeof(INDICE_DATO)+sizeof(int),
+			&error
+		);
+	}
+	/* Clean up! */
+	free(leido);
+	return k.i_clave;
+}
+
+char *abreviar(char *primera, char *actual, int *iguales)
+{
+	(*iguales) = 0;
+	while (((*primera) != '\0') && ((*actual) != '\0')) {
+		if ((*primera) == (*actual)) {
+			primera++;
+			actual++;
+			(*iguales)++;
+		} else {
+			/* No coinciden mas! */
+			break;
+		}
+	}
+
+	return actual;
+}
+
+static void abreviar_claves(INDICE *idx, B_NodoEntry *array, B_NodoHeader *header)
+{
+	char *primera, *actual, *resto, salvar[100];
+	EMUFS_REG_SIZE size;
+	int error, i;
+	int iguales;
+
+	/* Agarro la primer clave entera como referencia */
+	primera = (char *)idx->emu_string->leer_registro(idx->emu_string, array[0].clave, &size, &error);
+	for(i=1; i<header->cant; i++) {
+		actual = (char *)idx->emu_string->leer_registro(idx->emu_string, array[i].clave, &size, &error);
+		if (*actual == '*') {
+			free(actual);
+			continue;
+		}
+		resto = abreviar(primera, actual, &iguales);
+		/* Para que tenga sentido abreviar tengo que tener
+		 * mas de 2 letras iguales, si no no gano nada y complica las cosas
+		 */
+		if (iguales > 1) {
+			sprintf(salvar, "%d|%s", iguales, resto);
+			free(actual);
+			error = 0;
+			idx->emu_string->modificar_registro(idx->emu_string, array[i].clave.i_clave, salvar, strlen(salvar)+1, &error);
+		} else {
+			free(primera);
+			primera = actual;
+		}
+	}
+	
+	free(primera);
+}
+
+static void desabreviar_claves(INDICE *idx, B_NodoEntry *array, B_NodoHeader *header)
+{
+	char *primera, *actual, *resto, salvar[100];
+	EMUFS_REG_SIZE size;
+	int error, i;
+	int iguales;
+
+	/* Agarro la primer clave entera como referencia */
+	primera = (char *)idx->emu_string->leer_registro(idx->emu_string, array[0].clave, &size, &error);
+	for(i=1; i<header->cant; i++) {
+		actual = (char *)idx->emu_string->leer_registro(idx->emu_string, array[i].clave, &size, &error);
+		if (*actual == '*') {
+			free(actual);
+			continue;
+		}
+		iguales = strtol(actual, &resto, 10);
+		if ((iguales > 0) && (*resto == '|')) {
+			strncpy(salvar, primera, iguales);
+			salvar[iguales] = '\0';
+			strcat(salvar, resto+1); /* +1 para saltar el separador */
+			idx->emu_string->modificar_registro(idx->emu_string, array[i].clave.i_clave, salvar, strlen(salvar)+1, &error);
+			free(actual);
+		} else {
+			free(primera);
+			primera = actual;
+		}
+	}
+	
+	free(primera);
+}
+