diff options
| author | Charles.Forsyth <devnull@localhost> | 2006-12-22 21:39:35 +0000 |
|---|---|---|
| committer | Charles.Forsyth <devnull@localhost> | 2006-12-22 21:39:35 +0000 |
| commit | 74a4d8c26dd3c1e9febcb717cfd6cb6512991a7a (patch) | |
| tree | c6e220ba61db3a6ea4052e6841296d829654e664 /utils/rcsh/glob.c | |
| parent | 46439007cf417cbd9ac8049bb4122c890097a0fa (diff) | |
20060303
Diffstat (limited to 'utils/rcsh/glob.c')
| -rw-r--r-- | utils/rcsh/glob.c | 286 |
1 files changed, 286 insertions, 0 deletions
diff --git a/utils/rcsh/glob.c b/utils/rcsh/glob.c new file mode 100644 index 00000000..7640eeb1 --- /dev/null +++ b/utils/rcsh/glob.c @@ -0,0 +1,286 @@ +#include "rc.h" + +char *globname; +Word *globv; + +int matchfn(char *s, char *p); +int globsize(char *p); + +/* + * delete all the GLOB marks from s, in place + */ +void +deglob(char *s) +{ + char *t=s; + do{ + if(*t==GLOB) t++; + *s++=*t; + }while(*t++); +} + +int +globcmp(const void *s, const void *t) +{ + return strcmp(*(char**)s, *(char**)t); +} + +void +globsort(Word *left, Word *right) +{ + char **list; + Word *a; + int n=0; + for(a=left;a!=right;a=a->next) n++; + list=(char **)malloc(n*sizeof(char *)); + for(a=left,n=0;a!=right;a=a->next,n++) list[n]=a->word; + qsort((void*)list, (size_t)n, sizeof(char*), globcmp); + for(a=left,n=0;a!=right;a=a->next,n++) a->word=list[n]; + free(list); +} + +/* + * Push names prefixed by globname and suffixed by a match of p onto the astack. + * namep points to the end of the prefix in globname. + */ +void +globdir(char *p, char *namep) +{ + char *t, *q, *newp; + Direntry *dp, *dq; + Dir *dir; + + /* scan the pattern looking for a component with a metacharacter in it */ + if(*p=='\0'){ + globv=newword(globname, globv); + return; + } + t=namep; + newp=p; + while(*newp){ + if(*newp==GLOB) + break; + *t=*newp++; + if(*t++=='/'){ + namep=t; + p=newp; + } + } + /* If we ran out of pattern, append the name if accessible */ + if(*newp=='\0'){ + *t='\0'; + if(access(globname, 0)==0) + globv=newword(globname, globv); + return; + } + /* read the directory and recur for any entry that matches */ + *namep='\0'; + t = globname; + if(*t == 0) + t = "."; + q = strdup(t); + if (q[strlen(q)-1] == '/') + q[strlen(q)-1] = 0; + if((dir=dirstat(q)) == nil || !(dir->mode&0x80000000)){ + free(dir); + return; + } + free(dir); + dq = readdirect(q); + if(dq == 0){ + fprint(2, "could not open %s: %r\n", q); + return; + } + while(*newp!='/' && *newp!='\0') + newp++; + for(dp = dq;dp->name; dp++){ + strcpy(namep, dp->name); + if(matchfn(namep, p)) + globdir(newp, namep+strlen(namep)); + free(dp->name); + } + free(dq); +} + +/* + * Push all file names matched by p on the current thread's stack. + * If there are no matches, the list consists of p. + */ +void +glob(char *p) +{ + Word *svglobv=globv; + int globlen=globsize(p); + + if(globlen == 0){ + deglob(p); + globv=newword(p, globv); + return; + } + globname=malloc(globlen); + globname[0]='\0'; + globdir(p, globname); + free(globname); + if(svglobv==globv){ + deglob(p); + globv=newword(p, globv); + } + else + globsort(globv, svglobv); +} + + +/* + * Do p and q point at equal utf codes + */ +int +equtf(char *p, char *q) +{ + if(*p!=*q) + return 0; + if(twobyte(*p)) return p[1]==q[1]; + if(threebyte(*p)){ + if(p[1]!=q[1]) return 0; + if(p[1]=='\0') return 1; /* broken code at end of string! */ + return p[2]==q[2]; + } + return 1; +} + +/* + * Return a pointer to the next utf code in the string, + * not jumping past nuls in broken utf codes! + */ +char * +nextutf(char *p) +{ + if(twobyte(*p)) + return p[1]=='\0'?p+1:p+2; + if(threebyte(*p)) + return p[1]=='\0'?p+1:p[2]=='\0'?p+2:p+3; + return p+1; +} + +/* + * Convert the utf code at *p to a unicode value + */ +int +unicode(char *p) +{ + int u=*p&0xff; + if(twobyte(u)) + return ((u&0x1f)<<6)|(p[1]&0x3f); + if(threebyte(u)) + return (u<<12)|((p[1]&0x3f)<<6)|(p[2]&0x3f); + return u; +} + +/* + * Does the string s match the pattern p + * . and .. are only matched by patterns starting with . + * * matches any sequence of characters + * ? matches any single character + * [...] matches the enclosed list of characters + */ +int +matchfn(char *s, char *p) +{ + if(s[0]=='.' && (s[1]=='\0' || s[1]=='.' && s[2]=='\0') && p[0]!='.') + return 0; + return match(s, p, '/'); +} + +int +match(char *s, char *p, int stop) +{ + int compl, hit, lo, hi, t, c; + + for(;*p!=stop && *p!='\0';s=nextutf(s),p=nextutf(p)) { + if(*p!=GLOB){ + if(!equtf(p, s)) return 0; + } + else switch(*++p){ + case GLOB: + if(*s!=GLOB) return 0; + break; + case '*': + for(;;){ + if(match(s, nextutf(p), stop)) return 1; + if(!*s) break; + s=nextutf(s); + } + return 0; + case '?': + if(*s=='\0') return 0; + break; + case '[': + if(*s=='\0') return 0; + c=unicode(s); + p++; + compl=*p=='~'; + if(compl) p++; + hit=0; + while(*p!=']'){ + if(*p=='\0') return 0; /* syntax error */ + lo=unicode(p); + p=nextutf(p); + if(*p!='-') hi=lo; + else{ + p++; + if(*p=='\0') return 0; /* syntax error */ + hi=unicode(p); + p=nextutf(p); + if(hi<lo){ t=lo; lo=hi; hi=t; } + } + if(lo<=c && c<=hi) hit=1; + } + if(compl) hit=!hit; + if(!hit) return 0; + break; + } + } + return *s=='\0'; +} + +void +globlist1(Word *gl) +{ + if(gl){ + globlist1(gl->next); + glob(gl->word); + } +} + +void +globlist(void) +{ + Word *a; + + globv=0; + globlist1(runq->argv->words); + poplist(); + pushlist(); + if(globv){ + for(a=globv;a->next;a=a->next); + a->next=runq->argv->words; + runq->argv->words=globv; + } +} + +#define NDIR 128 +int +globsize(char *p) +{ + ulong isglob=0, globlen=NDIR+1; + + for(;*p;p++){ + if(*p==GLOB){ + p++; + if(*p!=GLOB) isglob++; + globlen+=*p=='*'?NDIR:1; + } + else + globlen++; + } + return isglob?globlen:0; +} |
