staden-lg/src/indexseqlibs/pirentryname1.c

85 lines
2.0 KiB
C

/* pirentryname1 */
#include <stdio.h>
#include <stdlib.h>
#include <sys/types.h>
#include <string.h>
#define MAXLINE 81 /* maximum input line length*/
/* program to create index for pir library in embl cdrom form */
/* this one gets the entry names and offsets and writes them to an ascii file
this file is sorted, then the next program converts the sorted file to binary
and adds the header */
char patternENTRY[] = "ENTRY";
char patternSEQUENCE[] = "SEQUENCE";
#define patmatch(L,P) (strncmp((L),(P),strlen(P))==0)
int main(int argc, char *argv[])
{
FILE *ifp;
FILE *ofp;
char line[MAXLINE];
char entry_name[10];
off_t entry_offset = 0;
off_t sequence_offset = 0;
long entries_in = 0;
long entries_out = 0;
int leftChar = 16;
printf("pirentryname1 Version 1.0\n");
if (argc != 4) {
fprintf(stderr,"Usage: pirentryname1 filein fileout division\n");
exit(2);
}
if ((ifp = fopen(argv[1],"r")) == NULL) {
fprintf(stderr,"pirentryname1: cannot open input file %s\n",argv[1]);
exit(1);
}
if ((ofp = fopen(argv[2],"w")) == NULL) {
fprintf(stderr,"pirentryname1: cannot open output file %s\n",argv[2]);
exit(1);
}
entry_name[0]='\0';
while (fgets(line,MAXLINE,ifp)!=NULL){
if (patmatch(line, patternENTRY)){
if (*entry_name)
printf("No sequence for entry %-10.10s\n",entry_name);
strncpy(entry_name,&line[leftChar],10);
entry_offset = ftell(ifp) - strlen(line);
entries_in++;
} else if (patmatch(line, patternSEQUENCE) && *entry_name) {
fgets(line, MAXLINE, ifp);
fgets(line, MAXLINE, ifp);
sequence_offset = ftell(ifp) - strlen(line) + 8;
/* 8 = magic offset to first character of sequence */
fprintf(ofp,"%-10.10s %10ld %10ld %-5.5s\n",entry_name,entry_offset,sequence_offset,argv[3]);
entries_out++;
entry_name[0]='\0';
}
}
printf(" Number of entries read = %ld\n",entries_in);
printf(" Number of entries written = %ld\n\n",entries_out);
fclose(ifp);
fclose(ofp);
return 0;
}