1 /*
2  * Copyright (c) 2007, Novell Inc.
3  *
4  * This program is licensed under the BSD license, read LICENSE.BSD
5  * for further information
6  */
7 
8 #include <sys/types.h>
9 #include <stdio.h>
10 #include <stdlib.h>
11 #include <string.h>
12 
13 #include "pool.h"
14 #include "repo.h"
15 #define DISABLE_SPLIT
16 #include "tools_util.h"
17 #include "repo_rpmmd.h"
18 #include "chksum.h"
19 #include "solv_xmlparser.h"
20 #ifdef ENABLE_COMPLEX_DEPS
21 #include "pool_parserpmrichdep.h"
22 #endif
23 #include "repodata_diskusage.h"
24 
/*
 * Parser states. Every value names the XML element the parser is
 * currently inside; the transitions between them are listed in the
 * stateswitches[] table. The values are passed as 'state' to the
 * startElement() and endElement() callbacks.
 */
enum state {
  STATE_START,		/* outside of any solvable */

  STATE_SOLVABLE,	/* inside a product/pattern/patch/package element */

  STATE_NAME,
  STATE_ARCH,
  STATE_VERSION,

  /* package rpm-md */
  STATE_LOCATION,
  STATE_CHECKSUM,
  STATE_RPM_GROUP,
  STATE_RPM_LICENSE,

  /* resobject attributes */
  STATE_SUMMARY,
  STATE_DESCRIPTION,
  STATE_DISTRIBUTION,
  STATE_PACKAGER,
  STATE_URL,
  STATE_INSNOTIFY,
  STATE_DELNOTIFY,
  STATE_VENDOR,
  STATE_SIZE,
  STATE_TIME,
  STATE_DOWNLOADSIZE,
  STATE_INSTALLTIME,	/* "install-time" element, see also STATE_INSTALL_TIME */
  STATE_INSTALLONLY,

  /* Novell/SUSE extended attributes */
  STATE_EULA,
  STATE_KEYWORD,
  STATE_DISKUSAGE,
  STATE_DIRS,
  STATE_DIR,

  /* patch */
  STATE_ID,
  STATE_TIMESTAMP,
  STATE_AFFECTSPKG,
  STATE_REBOOTNEEDED,

  /* pattern attributes */
  STATE_CATEGORY, /* pattern and patches */
  STATE_ORDER,
  STATE_INCLUDES,
  STATE_INCLUDESENTRY,
  STATE_EXTENDS,
  STATE_EXTENDSENTRY,
  STATE_SCRIPT,
  STATE_ICON,
  STATE_USERVISIBLE,
  STATE_DEFAULT,
  STATE_INSTALL_TIME,	/* second state mapped to the "install-time" element */

  /* product */
  STATE_RELNOTESURL,
  STATE_UPDATEURL,
  STATE_OPTIONALURL,
  STATE_FLAG,

  /* rpm-md dependencies inside the format tag */
  STATE_PROVIDES,
  STATE_REQUIRES,
  STATE_OBSOLETES,
  STATE_CONFLICTS,
  STATE_RECOMMENDS,
  STATE_SUPPLEMENTS,
  STATE_SUGGESTS,
  STATE_ENHANCES,
  STATE_FRESHENS,
  STATE_SOURCERPM,
  STATE_HEADERRANGE,
  STATE_BUILDHOST,

  /* one state per <rpm:entry>/<item> child of the dependency containers above */
  STATE_PROVIDESENTRY,
  STATE_REQUIRESENTRY,
  STATE_OBSOLETESENTRY,
  STATE_CONFLICTSENTRY,
  STATE_RECOMMENDSENTRY,
  STATE_SUPPLEMENTSENTRY,
  STATE_SUGGESTSENTRY,
  STATE_ENHANCESENTRY,
  STATE_FRESHENSENTRY,

  STATE_FILE,

  STATE_CHANGELOG,

  /* general */
  NUMSTATES		/* number of states; also marks the last stateswitches[] entry */
};
118 
/*
 * State transition table for the XML parser.
 *
 * Each entry reads { from-state, element name, to-state, flag }: when
 * the parser is in 'from-state' and sees an opening tag with the given
 * name it switches to 'to-state'. The list is terminated by an entry
 * whose from-state is NUMSTATES.
 *
 * NOTE(review): the fourth field presumably tells the parser whether the
 * element's text content has to be collected (the entries set to 1 are
 * the ones whose content is consumed in endElement()) -- confirm against
 * the solv_xmlparser_element declaration.
 */
static struct solv_xmlparser_element stateswitches[] = {
  /** fake tag used to enclose multiple xml files in one **/
  { STATE_START,       "rpmmd",           STATE_START,    0 },

  /** tags for different package data, just ignore them **/
  { STATE_START,       "patterns",        STATE_START,    0 },
  { STATE_START,       "products",        STATE_START,    0 },
  { STATE_START,       "metadata",        STATE_START,    0 },
  { STATE_START,       "otherdata",       STATE_START,    0 },
  { STATE_START,       "filelists",       STATE_START,    0 },
  { STATE_START,       "diskusagedata",   STATE_START,    0 },
  { STATE_START,       "susedata",        STATE_START,    0 },

  /* the elements that describe one solvable each */
  { STATE_START,       "product",         STATE_SOLVABLE, 0 },
  { STATE_START,       "pattern",         STATE_SOLVABLE, 0 },
  { STATE_START,       "patch",           STATE_SOLVABLE, 0 },
  { STATE_START,       "package",         STATE_SOLVABLE, 0 },

  /* <format> only groups further package data, so the state is kept */
  { STATE_SOLVABLE,    "format",          STATE_SOLVABLE, 0 },

  { STATE_SOLVABLE,    "name",            STATE_NAME, 1 },
  { STATE_SOLVABLE,    "arch",            STATE_ARCH, 1 },
  { STATE_SOLVABLE,    "version",         STATE_VERSION, 0 },

  /* package attributes rpm-md */
  { STATE_SOLVABLE,    "location",        STATE_LOCATION, 0 },
  { STATE_SOLVABLE,    "checksum",        STATE_CHECKSUM, 1 },

  /* resobject attributes */

  { STATE_SOLVABLE,    "summary",         STATE_SUMMARY,      1 },
  { STATE_SOLVABLE,    "description",     STATE_DESCRIPTION,  1 },
  { STATE_SOLVABLE,    "distribution",    STATE_DISTRIBUTION, 1 },
  { STATE_SOLVABLE,    "url",             STATE_URL,          1 },
  { STATE_SOLVABLE,    "packager",        STATE_PACKAGER,     1 },
  { STATE_SOLVABLE,    "vendor",          STATE_VENDOR,       1 },
  { STATE_SOLVABLE,    "size",            STATE_SIZE,         0 },
  { STATE_SOLVABLE,    "archive-size",    STATE_DOWNLOADSIZE, 1 },
  { STATE_SOLVABLE,    "install-time",    STATE_INSTALLTIME,  1 },
  { STATE_SOLVABLE,    "install-only",    STATE_INSTALLONLY,  1 },
  { STATE_SOLVABLE,    "time",            STATE_TIME,         0 },

  /* extended Novell/SUSE attributes (susedata.xml) */
  { STATE_SOLVABLE,    "eula",            STATE_EULA,         1 },
  { STATE_SOLVABLE,    "keyword",         STATE_KEYWORD,      1 },
  { STATE_SOLVABLE,    "diskusage",       STATE_DISKUSAGE,    0 },

  /* pattern attribute */
  { STATE_SOLVABLE,    "script",          STATE_SCRIPT,        1 },
  { STATE_SOLVABLE,    "icon",            STATE_ICON,          1 },
  { STATE_SOLVABLE,    "uservisible",     STATE_USERVISIBLE,   1 },
  { STATE_SOLVABLE,    "category",        STATE_CATEGORY,      1 },
  { STATE_SOLVABLE,    "order",           STATE_ORDER,         1 },
  { STATE_SOLVABLE,    "includes",        STATE_INCLUDES,      0 },
  { STATE_SOLVABLE,    "extends",         STATE_EXTENDS,       0 },
  { STATE_SOLVABLE,    "default",         STATE_DEFAULT,       1 },
  /* NOTE(review): "install-time" is already mapped to STATE_INSTALLTIME
   * above for the same from-state; which of the two entries takes effect
   * depends on the parser's lookup order -- confirm */
  { STATE_SOLVABLE,    "install-time",    STATE_INSTALL_TIME,  1 },

  /* product attributes */
  /* note the product type is an attribute */
  { STATE_SOLVABLE,    "release-notes-url", STATE_RELNOTESURL, 1 },
  { STATE_SOLVABLE,    "update-url",      STATE_UPDATEURL,   1 },
  { STATE_SOLVABLE,    "optional-url",    STATE_OPTIONALURL, 1 },
  { STATE_SOLVABLE,    "flag",            STATE_FLAG,        1 },

  { STATE_SOLVABLE,    "rpm:vendor",      STATE_VENDOR,      1 },
  { STATE_SOLVABLE,    "rpm:group",       STATE_RPM_GROUP,   1 },
  { STATE_SOLVABLE,    "rpm:license",     STATE_RPM_LICENSE, 1 },

  /* rpm-md dependencies */
  { STATE_SOLVABLE,    "rpm:provides",    STATE_PROVIDES,     0 },
  { STATE_SOLVABLE,    "rpm:requires",    STATE_REQUIRES,     0 },
  { STATE_SOLVABLE,    "rpm:obsoletes",   STATE_OBSOLETES,    0 },
  { STATE_SOLVABLE,    "rpm:conflicts",   STATE_CONFLICTS,    0 },
  { STATE_SOLVABLE,    "rpm:recommends",  STATE_RECOMMENDS ,  0 },
  { STATE_SOLVABLE,    "rpm:supplements", STATE_SUPPLEMENTS,  0 },
  { STATE_SOLVABLE,    "rpm:suggests",    STATE_SUGGESTS,     0 },
  { STATE_SOLVABLE,    "rpm:enhances",    STATE_ENHANCES,     0 },
  { STATE_SOLVABLE,    "rpm:freshens",    STATE_FRESHENS,     0 },
  { STATE_SOLVABLE,    "rpm:sourcerpm",   STATE_SOURCERPM,    1 },
  { STATE_SOLVABLE,    "rpm:header-range", STATE_HEADERRANGE, 0 },
  { STATE_SOLVABLE,    "rpm:buildhost",   STATE_BUILDHOST,    1 },
  { STATE_SOLVABLE,    "file",            STATE_FILE, 1 },
  { STATE_SOLVABLE,    "changelog",       STATE_CHANGELOG, 1 },

   /* extended Novell/SUSE diskusage attributes (susedata.xml) */
  { STATE_DISKUSAGE,   "dirs",            STATE_DIRS,         0 },
  { STATE_DIRS,        "dir",             STATE_DIR,          0 },

  /* the individual entries of the dependency containers */
  { STATE_PROVIDES,    "rpm:entry",       STATE_PROVIDESENTRY, 0 },
  { STATE_REQUIRES,    "rpm:entry",       STATE_REQUIRESENTRY, 0 },
  { STATE_OBSOLETES,   "rpm:entry",       STATE_OBSOLETESENTRY, 0 },
  { STATE_CONFLICTS,   "rpm:entry",       STATE_CONFLICTSENTRY, 0 },
  { STATE_RECOMMENDS,  "rpm:entry",       STATE_RECOMMENDSENTRY, 0 },
  { STATE_SUPPLEMENTS, "rpm:entry",       STATE_SUPPLEMENTSENTRY, 0 },
  { STATE_SUGGESTS,    "rpm:entry",       STATE_SUGGESTSENTRY, 0 },
  { STATE_ENHANCES,    "rpm:entry",       STATE_ENHANCESENTRY, 0 },
  { STATE_FRESHENS,    "rpm:entry",       STATE_FRESHENSENTRY, 0 },

  /* pattern includes/extends lists */
  { STATE_INCLUDES,    "item",            STATE_INCLUDESENTRY, 0 },
  { STATE_EXTENDS,     "item",            STATE_EXTENDSENTRY,  0 },

  /* end marker */
  { NUMSTATES}
};
223 
/*
 * Parser context. One instance is shared by all XML callbacks; they
 * obtain it from the parser's userdata pointer.
 */
struct parsedata {
  int ret;				/* set to the pool_error() result when a callback detects an error */
  Pool *pool;
  Repo *repo;				/* repo the solvables are added to */
  Repodata *data;			/* repodata receiving the non-core attributes */
  char *kind;				/* "pattern", "product" or "patch"; 0 for plain packages */
  Solvable *solvable;			/* solvable being parsed; 0 outside of one or if it is skipped */
  Offset freshens;			/* freshens deps, handed to repo_rewrite_suse_deps() at the end of the solvable */

  struct solv_xmlparser xmlp;
  struct joindata jd;			/* scratch space for join2()/join_dup() */
  /* temporary storage for the "lang" attribute of the current tag */
  const char *tmplang;
  Id chksumtype;			/* type of the <checksum> currently parsed, 0 if unknown */
  Id handle;				/* id of the current solvable, used as repodata handle */
  Queue diskusageq;			/* (dir id, size, count) triples collected from <dir> tags */
  const char *language;			/* default language */
  Id langcache[ID_NUM_INTERNAL];	/* cache for the default language */

  /* cache of the directory used by the previous <file> entry */
  Id lastdir;				/* its dir id, 0 if nothing is cached */
  char *lastdirstr;			/* its name */
  int lastdirstrl;			/* allocated size of lastdirstr */

  Id changelog_handle;			/* repodata handle of the current <changelog> entry */

  int extending;			/* are we extending an existing solvable? */
  int first;				/* first solvable we added */
  int cshash_filled;			/* hash is filled with data */

  Hashtable cshash;			/* checksum hash -> offset into csdata */
  Hashval cshashm;			/* hash mask */
  int ncshash;				/* entries used */
  unsigned char *csdata;		/* [len, checksum, id] */
  int ncsdata;				/* used bytes */
};
259 
260 static Id
langtag(struct parsedata * pd,Id tag,const char * language)261 langtag(struct parsedata *pd, Id tag, const char *language)
262 {
263   if (language)
264     {
265       if (!language[0] || !strcmp(language, "en"))
266 	return tag;
267       return pool_id2langid(pd->pool, tag, language, 1);
268     }
269   if (!pd->language)
270     return tag;
271   if (tag >= ID_NUM_INTERNAL)
272     return pool_id2langid(pd->pool, tag, pd->language, 1);
273   if (!pd->langcache[tag])
274     pd->langcache[tag] = pool_id2langid(pd->pool, tag, pd->language, 1);
275   return pd->langcache[tag];
276 }
277 
278 /*
279  * makeevr_atts
280  * parse 'epoch', 'ver' and 'rel', return evr Id
281  *
282  */
283 
284 static Id
makeevr_atts(Pool * pool,struct parsedata * pd,const char ** atts)285 makeevr_atts(Pool *pool, struct parsedata *pd, const char **atts)
286 {
287   const char *e, *v, *r, *v2;
288   char *c, *space;
289   int l;
290 
291   e = v = r = 0;
292   for (; *atts; atts += 2)
293     {
294       if (!strcmp(*atts, "epoch"))
295 	e = atts[1];
296       else if (!strcmp(*atts, "ver"))
297 	v = atts[1];
298       else if (!strcmp(*atts, "rel"))
299 	r = atts[1];
300     }
301   if (e && (!*e || !strcmp(e, "0")))
302     e = 0;
303   if (v && !e)
304     {
305       for (v2 = v; *v2 >= '0' && *v2 <= '9'; v2++)
306         ;
307       if (v2 > v && *v2 == ':')
308 	e = "0";
309     }
310   l = 1;
311   if (e)
312     l += strlen(e) + 1;
313   if (v)
314     l += strlen(v);
315   if (r)
316     l += strlen(r) + 1;
317   c = space = solv_xmlparser_contentspace(&pd->xmlp, l);
318   if (e)
319     {
320       strcpy(c, e);
321       c += strlen(c);
322       *c++ = ':';
323     }
324   if (v)
325     {
326       strcpy(c, v);
327       c += strlen(c);
328     }
329   if (r)
330     {
331       *c++ = '-';
332       strcpy(c, r);
333       c += strlen(c);
334     }
335   *c = 0;
336   if (!*space)
337     return 0;
338 #if 0
339   fprintf(stderr, "evr: %s\n", space);
340 #endif
341   return pool_str2id(pool, space, 1);
342 }
343 
344 
345 /*
346  * dependency relations
347  */
348 
/*
 * Relation names as they appear in the "flags" attribute of a
 * dependency entry. adddep() searches this table and passes the index
 * of the match plus one as relation flags to pool_rel2id(), so the
 * order of the entries must not be changed.
 *
 * The table is read-only: both the pointers and the strings are const.
 */
static const char *const flagtab[] = {
  "GT",
  "EQ",
  "GE",
  "LT",
  "NE",
  "LE"
};
357 
358 
359 /*
360  * adddep
361  * parse attributes to reldep Id
362  *
363  */
364 
365 static unsigned int
adddep(Pool * pool,struct parsedata * pd,unsigned int olddeps,const char ** atts,int isreq)366 adddep(Pool *pool, struct parsedata *pd, unsigned int olddeps, const char **atts, int isreq)
367 {
368   Id id, marker;
369   const char *n, *f, *k;
370   const char **a;
371 
372   n = f = k = 0;
373   marker = isreq ? -SOLVABLE_PREREQMARKER : 0;
374   for (a = atts; *a; a += 2)
375     {
376       if (!strcmp(*a, "name"))
377 	n = a[1];
378       else if (!strcmp(*a, "flags"))
379 	f = a[1];
380       else if (!strcmp(*a, "kind"))
381 	k = a[1];
382       else if (isreq && !strcmp(*a, "pre") && a[1][0] == '1')
383 	marker = SOLVABLE_PREREQMARKER;
384     }
385   if (!n)
386     return olddeps;
387   if (k && !strcmp(k, "package"))
388     k = 0;
389   if (k)
390     {
391       int l = strlen(k) + 1 + strlen(n) + 1;
392       char *space = solv_xmlparser_contentspace(&pd->xmlp, l);
393       sprintf(space, "%s:%s", k, n);
394       id = pool_str2id(pool, space, 1);
395     }
396 #ifdef ENABLE_COMPLEX_DEPS
397   else if (!f && n[0] == '(')
398     {
399       id = pool_parserpmrichdep(pool, n);
400       if (!id)
401 	return olddeps;
402     }
403 #endif
404   else
405     id = pool_str2id(pool, (char *)n, 1);
406   if (f)
407     {
408       Id evr = makeevr_atts(pool, pd, atts);
409       int flags;
410       for (flags = 0; flags < 6; flags++)
411 	if (!strcmp(f, flagtab[flags]))
412 	  break;
413       flags = flags < 6 ? flags + 1 : 0;
414       id = pool_rel2id(pool, id, evr, flags, 1);
415     }
416 #if 0
417   fprintf(stderr, "new dep %s\n", pool_dep2str(pool, id));
418 #endif
419   return repo_addid_dep(pd->repo, olddeps, id, marker);
420 }
421 
422 
423 /*
424  * set_description_author
425  *
426  */
427 static void
set_description_author(Repodata * data,Id handle,char * str,struct parsedata * pd)428 set_description_author(Repodata *data, Id handle, char *str, struct parsedata *pd)
429 {
430   char *aut, *p;
431 
432   if (!str || !*str)
433     return;
434   for (aut = str; (aut = strchr(aut, '\n')) != 0; aut++)
435     if (!strncmp(aut, "\nAuthors:\n--------\n", 19))
436       break;
437   if (aut)
438     {
439       /* oh my, found SUSE special author section */
440       int l = aut - str;
441       str[l] = 0;
442       while (l > 0 && str[l - 1] == '\n')
443 	str[--l] = 0;
444       if (l)
445 	repodata_set_str(data, handle, langtag(pd, SOLVABLE_DESCRIPTION, pd->tmplang), str);
446       p = aut + 19;
447       aut = str;        /* copy over */
448       while (*p == ' ' || *p == '\n')
449 	p++;
450       while (*p)
451 	{
452 	  if (*p == '\n')
453 	    {
454 	      *aut++ = *p++;
455 	      while (*p == ' ')
456 		p++;
457 	      continue;
458 	    }
459 	  *aut++ = *p++;
460 	}
461       while (aut != str && aut[-1] == '\n')
462 	aut--;
463       *aut = 0;
464       if (*str)
465 	repodata_set_str(data, handle, SOLVABLE_AUTHORS, str);
466     }
467   else if (*str)
468     repodata_set_str(data, handle, langtag(pd, SOLVABLE_DESCRIPTION, pd->tmplang), str);
469 }
470 
471 
472 /*-----------------------------------------------*/
473 /* checksum hash functions
474  *
475  * used to look up a solvable with the checksum for solvable extension purposes.
476  *
477  */
478 
/*
 * init_cshash
 * counterpart of free_cshash(). Currently does nothing and leaves the
 * checksum hash fields of pd untouched.
 */
static void
init_cshash(struct parsedata *pd)
{
}
483 
484 static void
free_cshash(struct parsedata * pd)485 free_cshash(struct parsedata *pd)
486 {
487   pd->cshash = solv_free(pd->cshash);
488   pd->ncshash = 0;
489   pd->cshashm = 0;
490   pd->csdata = solv_free(pd->csdata);
491   pd->ncsdata = 0;
492 }
493 
494 static inline Hashval
hashkey(const unsigned char * key,int keyl)495 hashkey(const unsigned char *key, int keyl)
496 {
497   return key[0] << 24 | key[1] << 16 | key[2] << 8 | key[3];
498 }
499 
500 static void
rebuild_cshash(struct parsedata * pd)501 rebuild_cshash(struct parsedata *pd)
502 {
503   Hashval h, hh, hm;
504   Hashtable ht;
505   unsigned char *d, *de;
506 
507   hm = pd->cshashm;
508 #if 0
509   fprintf(stderr, "rebuild cshash with mask 0x%x\n", hm);
510 #endif
511   solv_free(pd->cshash);
512   ht = pd->cshash = (Hashtable)solv_calloc(hm + 1, sizeof(Id));
513   d = pd->csdata;
514   de = d + pd->ncsdata;
515   while (d != de)
516     {
517       h = hashkey(d + 1, d[0] + 1) & hm;
518       hh = HASHCHAIN_START;
519       while (ht[h])
520 	h = HASHCHAIN_NEXT(h, hh, hm);
521       ht[h] = d + 1 - pd->csdata;
522       d += 2 + d[0] + sizeof(Id);
523     }
524 }
525 
526 static void
put_in_cshash(struct parsedata * pd,const unsigned char * key,int keyl,Id id)527 put_in_cshash(struct parsedata *pd, const unsigned char *key, int keyl, Id id)
528 {
529   Hashtable ht;
530   Hashval h, hh, hm;
531   unsigned char *d;
532 
533   if (keyl < 4 || keyl > 256)
534     return;
535   ht = pd->cshash;
536   hm = pd->cshashm;
537   h = hashkey(key, keyl) & hm;
538   hh = HASHCHAIN_START;
539   if (ht)
540     {
541       while (ht[h])
542 	{
543 	  unsigned char *d = pd->csdata + ht[h];
544 	  if (d[-1] == keyl - 1 && !memcmp(key, d, keyl))
545 	    return;		/* XXX: first id wins... */
546 	  h = HASHCHAIN_NEXT(h, hh, hm);
547 	}
548     }
549   /* a new entry. put in csdata */
550   pd->csdata = solv_extend(pd->csdata, pd->ncsdata, 1 + keyl + sizeof(Id), 1, 4095);
551   d = pd->csdata + pd->ncsdata;
552   d[0] = keyl - 1;
553   memcpy(d + 1, key, keyl);
554   memcpy(d + 1 + keyl, &id, sizeof(Id));
555   pd->ncsdata += 1 + keyl + sizeof(Id);
556   if ((Hashval)++pd->ncshash * 2 > hm)
557     {
558       pd->cshashm = pd->cshashm ? (2 * pd->cshashm + 1) : 4095;
559       rebuild_cshash(pd);
560     }
561   else
562     ht[h] = pd->ncsdata - (keyl + sizeof(Id));
563 }
564 
565 static Id
lookup_cshash(struct parsedata * pd,const unsigned char * key,int keyl)566 lookup_cshash(struct parsedata *pd, const unsigned char *key, int keyl)
567 {
568   Hashtable ht;
569   Hashval h, hh, hm;
570 
571   if (keyl < 4 || keyl > 256)
572     return 0;
573   ht = pd->cshash;
574   if (!ht)
575     return 0;
576   hm = pd->cshashm;
577   h = hashkey(key, keyl) & hm;
578   hh = HASHCHAIN_START;
579   while (ht[h])
580     {
581       unsigned char *d = pd->csdata + ht[h];
582       if (d[-1] == keyl - 1 && !memcmp(key, d, keyl))
583 	{
584 	  Id id;
585 	  memcpy(&id, d + keyl, sizeof(Id));
586 	  return id;
587 	}
588       h = HASHCHAIN_NEXT(h, hh, hm);
589     }
590   return 0;
591 }
592 
593 static void
fill_cshash_from_repo(struct parsedata * pd)594 fill_cshash_from_repo(struct parsedata *pd)
595 {
596   Dataiterator di;
597   /* setup join data */
598   dataiterator_init(&di, pd->pool, pd->repo, 0, SOLVABLE_CHECKSUM, 0, 0);
599   while (dataiterator_step(&di))
600     put_in_cshash(pd, (const unsigned char *)di.kv.str, solv_chksum_len(di.key->type), di.solvid);
601   dataiterator_free(&di);
602 }
603 
604 static void
fill_cshash_from_new_solvables(struct parsedata * pd)605 fill_cshash_from_new_solvables(struct parsedata *pd)
606 {
607   Pool *pool = pd->pool;
608   int i, l;
609   KeyValue kv;
610   Repokey *key;
611 
612   for (i = pd->first; i < pool->nsolvables; i++)
613     {
614       if (pool->solvables[i].repo != pd->repo)
615 	continue;
616       if ((key = repodata_lookup_kv_uninternalized(pd->data, i, SOLVABLE_CHECKSUM, &kv)) == 0)
617 	continue;
618       if ((l = solv_chksum_len(key->type)) != 0)
619 	put_in_cshash(pd, (const unsigned char *)kv.str, l, i);
620     }
621 }
622 
623 /*-----------------------------------------------*/
624 /* XML callbacks */
625 
/*
 * startElement
 *
 * Parser callback for an opening tag. 'state' is the state that was
 * entered for the element (see stateswitches[]), 'name' is the element
 * name and 'atts' a NULL terminated list of attribute name/value pairs.
 *
 * STATE_SOLVABLE creates a new solvable, or selects an existing one if
 * the element carries a 'pkgid' attribute. All other states evaluate
 * the attributes of the element and store them in the current solvable
 * or its repodata. Errors are reported with pool_error() and recorded
 * in pd->ret.
 */

static void
startElement(struct solv_xmlparser *xmlp, int state, const char *name, const char **atts)
{
  struct parsedata *pd = xmlp->userdata;
  Pool *pool = pd->pool;
  Solvable *s = pd->solvable;
  Id handle = pd->handle;
  const char *str;
  const char *pkgid;

  /* without a current solvable only the start of a new one is of interest */
  if (!s && state != STATE_SOLVABLE)
    return;

  switch(state)
    {
    case STATE_SOLVABLE:
      /* tell the element names apart by a few characters: pa"tt"ern,
       * p"r"oduct and pa"tc"h. "package" matches none of the tests and
       * keeps kind 0.
       * NOTE(review): "format" also leads to STATE_SOLVABLE in
       * stateswitches[]; presumably the parser does not call us for a
       * transition that stays in the same state -- confirm */
      pd->kind = 0;
      if (name[2] == 't' && name[3] == 't')
        pd->kind = "pattern";
      else if (name[1] == 'r')
        pd->kind = "product";
      else if (name[2] == 't' && name[3] == 'c')
        pd->kind = "patch";

      /* to support extension metadata files like others.xml which
         have the following structure:

         <otherdata xmlns="http://linux.duke.edu/metadata/other"
                    packages="101">
           <package pkgid="b78f8664cd90efe42e09a345e272997ef1b53c18"
                    name="zaptel-kmp-default"
                    arch="i586"><version epoch="0"
                    ver="1.2.10_2.6.22_rc4_git6_2" rel="70"/>
              ...

         we need to check if the pkgid is there and if it matches
         an already seen package, that means we don't need to create
         a new solvable but just append the attributes to the existing
         one.
      */
      pd->extending = 0;
      if ((pkgid = solv_xmlparser_find_attr("pkgid", atts)) != NULL)
        {
	  unsigned char chk[256];
	  int l;
	  const char *str = pkgid;	/* shadows the outer str; advanced by solv_hex2bin */
	  /* the checksum hash is only filled when it is needed for the first time */
	  if (!pd->cshash_filled)
	    {
	      pd->cshash_filled = 1;
	      fill_cshash_from_new_solvables(pd);
	    }
	  handle = 0;
	  /* convert into bin checksum */
	  l = solv_hex2bin(&str, chk, sizeof(chk));
          /* look at the checksum cache */
	  /* (only if the complete pkgid was converted, i.e. it ends after 2 * l hex digits) */
	  if (l >= 4 && !pkgid[2 * l])
	    handle = lookup_cshash(pd, chk, l);
#if 0
	  fprintf(stderr, "Lookup %s -> %d\n", pkgid, handle);
#endif
	  if (!handle)
	    {
              pool_debug(pool, SOLV_WARN, "the repository specifies extra information about package with checksum '%s', which does not exist in the repository.\n", pkgid);
	      /* no current solvable: the early return above skips all child elements */
	      pd->handle = 0;
	      pd->solvable = 0;
	      break;
	    }
	  pd->extending = 1;
        }
      else
        {
          /* this is a new package */
	  handle = repo_add_solvable(pd->repo);
	  if (!pd->first)
	    pd->first = handle;
          pd->freshens = 0;
        }
      pd->handle = handle;
      pd->solvable = pool_id2solvable(pool, handle);
      /* kind[1] == 'r' is only true for "product" */
      if (pd->kind && pd->kind[1] == 'r')
	{
	  /* products can have a type */
	  const char *type = solv_xmlparser_find_attr("type", atts);
	  if (type && *type)
	    repodata_set_str(pd->data, handle, PRODUCT_TYPE, type);
	}
#if 0
      fprintf(stderr, "package #%d\n", pd->solvable - pool->solvables);
#endif

      break;
    case STATE_VERSION:
      if (pd->extending && s->evr)
	break;		/* ignore version tag repetition in extend data */
      s->evr = makeevr_atts(pool, pd, atts);
      break;

    /* dependencies: the container element resets the list, every
     * entry element appends one dependency to it */
    case STATE_PROVIDES:
      s->provides = 0;
      break;
    case STATE_PROVIDESENTRY:
      s->provides = adddep(pool, pd, s->provides, atts, 0);
      break;
    case STATE_REQUIRES:
      s->requires = 0;
      break;
    case STATE_REQUIRESENTRY:
      /* isreq = 1: requires are the only deps that evaluate the 'pre' attribute */
      s->requires = adddep(pool, pd, s->requires, atts, 1);
      break;
    case STATE_OBSOLETES:
      s->obsoletes = 0;
      break;
    case STATE_OBSOLETESENTRY:
      s->obsoletes = adddep(pool, pd, s->obsoletes, atts, 0);
      break;
    case STATE_CONFLICTS:
      s->conflicts = 0;
      break;
    case STATE_CONFLICTSENTRY:
      s->conflicts = adddep(pool, pd, s->conflicts, atts, 0);
      break;
    case STATE_RECOMMENDS:
      s->recommends = 0;
      break;
    case STATE_RECOMMENDSENTRY:
      s->recommends = adddep(pool, pd, s->recommends, atts, 0);
      break;
    case STATE_SUPPLEMENTS:
      s->supplements= 0;
      break;
    case STATE_SUPPLEMENTSENTRY:
      s->supplements = adddep(pool, pd, s->supplements, atts, 0);
      break;
    case STATE_SUGGESTS:
      s->suggests = 0;
      break;
    case STATE_SUGGESTSENTRY:
      s->suggests = adddep(pool, pd, s->suggests, atts, 0);
      break;
    case STATE_ENHANCES:
      s->enhances = 0;
      break;
    case STATE_ENHANCESENTRY:
      s->enhances = adddep(pool, pd, s->enhances, atts, 0);
      break;
    /* freshens are not part of the solvable, they are collected in pd */
    case STATE_FRESHENS:
      pd->freshens = 0;
      break;
    case STATE_FRESHENSENTRY:
      pd->freshens = adddep(pool, pd, pd->freshens, atts, 0);
      break;
    /* remember the language of translatable texts until their content is stored */
    case STATE_EULA:
    case STATE_SUMMARY:
    case STATE_CATEGORY:
    case STATE_DESCRIPTION:
      pd->tmplang = join_dup(&pd->jd, solv_xmlparser_find_attr("lang", atts));
      break;
    case STATE_USERVISIBLE:
      repodata_set_void(pd->data, handle, SOLVABLE_ISVISIBLE);
      break;
    case STATE_INCLUDESENTRY:
      str = solv_xmlparser_find_attr("pattern", atts);
      if (str)
	repodata_add_poolstr_array(pd->data, handle, SOLVABLE_INCLUDES, join2(&pd->jd, "pattern", ":", str));
      break;
    case STATE_EXTENDSENTRY:
      str = solv_xmlparser_find_attr("pattern", atts);
      if (str)
	repodata_add_poolstr_array(pd->data, handle, SOLVABLE_EXTENDS, join2(&pd->jd, "pattern", ":", str));
      break;
    case STATE_LOCATION:
      str = solv_xmlparser_find_attr("href", atts);
      if (str)
	{
	  int medianr = 0;
	  const char *base = solv_xmlparser_find_attr("xml:base", atts);
	  if (base  && !strncmp(base, "media:", 6))
	    {
	      /* check for the media number in the fragment */
	      /* (the digits at the end of base, if they directly follow a '#') */
	      int l = strlen(base);
	      while (l && base[l - 1] >= '0' && base[l - 1] <= '9')
		l--;
	      if (l && base[l - 1] == '#' && base[l])
		medianr = atoi(base + l);
	    }
	  repodata_set_location(pd->data, handle, medianr, 0, str);
	  if (base)
	    repodata_set_poolstr(pd->data, handle, SOLVABLE_MEDIABASE, base);
	}
      break;
    case STATE_CHECKSUM:
      /* only the type is known here, the checksum itself is the element content */
      str = solv_xmlparser_find_attr("type", atts);
      pd->chksumtype = str && *str ? solv_chksum_str2type(str) : 0;
      if (!pd->chksumtype)
	pd->ret = pool_error(pool, -1, "line %d: unknown checksum type: %s", solv_xmlparser_lineno(xmlp), str ? str : "NULL");
      break;
    case STATE_TIME:
      {
        unsigned int t;
        str = solv_xmlparser_find_attr("build", atts);
        /* a build time of 0 is not stored */
        if (str && (t = atoi(str)) != 0)
          repodata_set_num(pd->data, handle, SOLVABLE_BUILDTIME, t);
	break;
      }
    case STATE_SIZE:
      if ((str = solv_xmlparser_find_attr("installed", atts)) != 0)
	repodata_set_num(pd->data, handle, SOLVABLE_INSTALLSIZE, strtoull(str, 0, 10));
      if ((str = solv_xmlparser_find_attr("package", atts)) != 0)
	repodata_set_num(pd->data, handle, SOLVABLE_DOWNLOADSIZE, strtoull(str, 0, 10));
      break;
    case STATE_HEADERRANGE:
      {
        unsigned int end;
        str = solv_xmlparser_find_attr("end", atts);
	if (str && (end = atoi(str)) != 0)
	  repodata_set_num(pd->data, handle, SOLVABLE_HEADEREND, end);
	break;
      }
      /*
        <diskusage>
          <dirs>
            <dir name="/" size="56" count="11"/>
            <dir name="usr/" size="56" count="11"/>
            <dir name="usr/bin/" size="38" count="10"/>
            <dir name="usr/share/" size="18" count="1"/>
            <dir name="usr/share/doc/" size="18" count="1"/>
          </dirs>
        </diskusage>
      */
    case STATE_DISKUSAGE:
      {
        /* Really, do nothing, wait for <dir> tag */
        break;
      }
    case STATE_DIR:
      {
        long filesz = 0, filenum = 0;
        Id did;

        if ((str = solv_xmlparser_find_attr("name", atts)) == 0)
	  {
	    pd->ret = pool_error(pool, -1, "<dir .../> tag without 'name' attribute");
            break;
	  }
	if (*str != '/')
	  {
	    /* relative name: source packages are accounted to /usr/src,
	     * for all other packages the name is made absolute */
	    if (s->arch == ARCH_SRC || s->arch == ARCH_NOSRC)
	      str = "/usr/src";
	    else
	      {
		int l = strlen(str) + 2;	/* room for the '/' and the terminating 0 */
		char *space = solv_xmlparser_contentspace(xmlp, l);
		space[0] = '/';
		memcpy(space + 1, str, l - 1);	/* copies the terminating 0 as well */
		str = space;
	    }
	  }
        did = repodata_str2dir(pd->data, str, 1);
        if ((str = solv_xmlparser_find_attr("size", atts)) != 0)
          filesz = strtol(str, 0, 0);
        if ((str = solv_xmlparser_find_attr("count", atts)) != 0)
          filenum = strtol(str, 0, 0);
        /* entries with neither size nor count are dropped */
        if (filesz || filenum)
          {
            queue_push(&pd->diskusageq, did);
            queue_push2(&pd->diskusageq, filesz, filenum);
          }
        break;
      }
    case STATE_CHANGELOG:
      /* every changelog entry gets a repodata handle of its own */
      pd->changelog_handle = repodata_new_handle(pd->data);
      if ((str = solv_xmlparser_find_attr("date", atts)) != 0)
	repodata_set_num(pd->data, pd->changelog_handle, SOLVABLE_CHANGELOG_TIME, strtoull(str, 0, 10));
      if ((str = solv_xmlparser_find_attr("author", atts)) != 0)
	repodata_set_str(pd->data, pd->changelog_handle, SOLVABLE_CHANGELOG_AUTHOR, str);
      break;
    default:
      break;
    }
}
909 
910 
911 /*
912  * endElement
913  */
914 
915 static void
endElement(struct solv_xmlparser * xmlp,int state,char * content)916 endElement(struct solv_xmlparser *xmlp, int state, char *content)
917 {
918   struct parsedata *pd = xmlp->userdata;
919   Pool *pool = pd->pool;
920   Solvable *s = pd->solvable;
921   Repo *repo = pd->repo;
922   Id handle = pd->handle;
923   Id id;
924   char *p;
925 
926   if (!s)
927     return;
928 
929   switch (state)
930     {
931     case STATE_SOLVABLE:
932       if (pd->extending)
933 	{
934 	  pd->solvable = 0;
935 	  break;
936 	}
937       if (pd->kind && !s->name) /* add namespace in case of NULL name */
938         s->name = pool_str2id(pool, join2(&pd->jd, pd->kind, ":", 0), 1);
939       if (!s->arch)
940         s->arch = ARCH_NOARCH;
941       if (!s->evr)
942         s->evr = ID_EMPTY;	/* some patterns have this */
943       if (s->name && s->arch != ARCH_SRC && s->arch != ARCH_NOSRC)
944         s->provides = repo_addid_dep(repo, s->provides, pool_rel2id(pool, s->name, s->evr, REL_EQ, 1), 0);
945       repo_rewrite_suse_deps(s, pd->freshens);
946       pd->freshens = 0;
947       pd->kind = 0;
948       pd->solvable = 0;
949       break;
950     case STATE_NAME:
951       if (pd->kind)
952         s->name = pool_str2id(pool, join2(&pd->jd, pd->kind, ":", content), 1);
953       else
954         s->name = pool_str2id(pool, content, 1);
955       break;
956     case STATE_ARCH:
957       s->arch = pool_str2id(pool, content, 1);
958       break;
959     case STATE_VENDOR:
960       s->vendor = pool_str2id(pool, content, 1);
961       break;
962     case STATE_RPM_GROUP:
963       repodata_set_poolstr(pd->data, handle, SOLVABLE_GROUP, content);
964       break;
965     case STATE_RPM_LICENSE:
966       repodata_set_poolstr(pd->data, handle, SOLVABLE_LICENSE, content);
967       break;
968     case STATE_CHECKSUM:
969       {
970 	unsigned char chk[256];
971 	int l = solv_chksum_len(pd->chksumtype);
972 	const char *str = content;
973 	if (!l || l > sizeof(chk))
974 	  break;
975 	if (solv_hex2bin(&str, chk, l) != l || content[2 * l])
976           {
977 	    pd->ret = pool_error(pool, -1, "line %u: invalid %s checksum", solv_xmlparser_lineno(xmlp), solv_chksum_type2str(pd->chksumtype));
978 	    break;
979           }
980         repodata_set_bin_checksum(pd->data, handle, SOLVABLE_CHECKSUM, pd->chksumtype, chk);
981 	/* we save the checksum to solvable id relationship for extending metadata */
982 	if (pd->cshash_filled)
983 	  put_in_cshash(pd, chk, l, s - pool->solvables);
984         break;
985       }
986     case STATE_FILE:
987       if ((p = strrchr(content, '/')) != 0)
988 	{
989 	  *p++ = 0;
990 	  if (pd->lastdir && !strcmp(pd->lastdirstr, content))
991 	    {
992 	      id = pd->lastdir;
993 	    }
994 	  else
995 	    {
996 	      int l = p - content;
997 	      if (l + 1 > pd->lastdirstrl)	/* + 1 for the possible leading / we need to insert */
998 		{
999 		  pd->lastdirstrl = l + 128;
1000 		  pd->lastdirstr = solv_realloc(pd->lastdirstr, pd->lastdirstrl);
1001 		}
1002 	      if (content[0] != '/')
1003 		{
1004 		  pd->lastdirstr[0] = '/';
1005 		  memcpy(pd->lastdirstr + 1, content, l);
1006 	          id = repodata_str2dir(pd->data, pd->lastdirstr, 1);
1007 		}
1008 	      else
1009 	        id = repodata_str2dir(pd->data, content, 1);
1010 	      pd->lastdir = id;
1011 	      memcpy(pd->lastdirstr, content, l);
1012 	    }
1013 	}
1014       else
1015 	{
1016 	  p = content;
1017 	  id = repodata_str2dir(pd->data, "/", 1);
1018 	}
1019       repodata_add_dirstr(pd->data, handle, SOLVABLE_FILELIST, id, p);
1020       break;
1021     case STATE_SUMMARY:
1022       repodata_set_str(pd->data, handle, langtag(pd, SOLVABLE_SUMMARY, pd->tmplang), content);
1023       break;
1024     case STATE_DESCRIPTION:
1025       set_description_author(pd->data, handle, content, pd);
1026       break;
1027     case STATE_CATEGORY:
1028       repodata_set_str(pd->data, handle, langtag(pd, SOLVABLE_CATEGORY, pd->tmplang), content);
1029       break;
1030     case STATE_DISTRIBUTION:
1031         repodata_set_poolstr(pd->data, handle, SOLVABLE_DISTRIBUTION, content);
1032         break;
1033     case STATE_URL:
1034       if (*content)
1035 	repodata_set_str(pd->data, handle, SOLVABLE_URL, content);
1036       break;
1037     case STATE_PACKAGER:
1038       if (*content)
1039 	repodata_set_poolstr(pd->data, handle, SOLVABLE_PACKAGER, content);
1040       break;
1041     case STATE_BUILDHOST:
1042       if (*content)
1043 	repodata_set_str(pd->data, handle, SOLVABLE_BUILDHOST, content);
1044       break;
1045     case STATE_SOURCERPM:
1046       if (*content)
1047 	repodata_set_sourcepkg(pd->data, handle, content);
1048       break;
1049     case STATE_RELNOTESURL:
1050       if (*content)
1051         {
1052           repodata_add_poolstr_array(pd->data, handle, PRODUCT_URL, content);
1053           repodata_add_idarray(pd->data, handle, PRODUCT_URL_TYPE, pool_str2id(pool, "releasenotes", 1));
1054         }
1055       break;
1056     case STATE_UPDATEURL:
1057       if (*content)
1058         {
1059           repodata_add_poolstr_array(pd->data, handle, PRODUCT_URL, content);
1060           repodata_add_idarray(pd->data, handle, PRODUCT_URL_TYPE, pool_str2id(pool, "update", 1));
1061         }
1062       break;
1063     case STATE_OPTIONALURL:
1064       if (*content)
1065         {
1066           repodata_add_poolstr_array(pd->data, handle, PRODUCT_URL, content);
1067           repodata_add_idarray(pd->data, handle, PRODUCT_URL_TYPE, pool_str2id(pool, "optional", 1));
1068         }
1069       break;
1070     case STATE_FLAG:
1071       if (*content)
1072         repodata_add_poolstr_array(pd->data, handle, PRODUCT_FLAGS, content);
1073       break;
1074     case STATE_EULA:
1075       if (*content)
1076 	repodata_set_str(pd->data, handle, langtag(pd, SOLVABLE_EULA, pd->tmplang), content);
1077       break;
1078     case STATE_KEYWORD:
1079       if (*content)
1080         repodata_add_poolstr_array(pd->data, handle, SOLVABLE_KEYWORDS, content);
1081       break;
1082     case STATE_DISKUSAGE:
1083       if (pd->diskusageq.count)
1084         repodata_add_diskusage(pd->data, handle, &pd->diskusageq);
1085       break;
1086     case STATE_ORDER:
1087       if (*content)
1088         repodata_set_str(pd->data, handle, SOLVABLE_ORDER, content);
1089       break;
1090     case STATE_CHANGELOG:
1091       repodata_set_str(pd->data, pd->changelog_handle, SOLVABLE_CHANGELOG_TEXT, content);
1092       repodata_add_flexarray(pd->data, handle, SOLVABLE_CHANGELOG, pd->changelog_handle);
1093       pd->changelog_handle = 0;
1094       break;
1095     default:
1096       break;
1097     }
1098 }
1099 
1100 
1101 /*-----------------------------------------------*/
1102 
1103 /*
1104  * repo_add_rpmmd
1105  * parse rpm-md metadata (primary, others)
1106  *
1107  */
1108 
1109 int
repo_add_rpmmd(Repo * repo,FILE * fp,const char * language,int flags)1110 repo_add_rpmmd(Repo *repo, FILE *fp, const char *language, int flags)
1111 {
1112   Pool *pool = repo->pool;
1113   struct parsedata pd;
1114   Repodata *data;
1115   unsigned int now;
1116 
1117   now = solv_timems(0);
1118   data = repo_add_repodata(repo, flags);
1119 
1120   memset(&pd, 0, sizeof(pd));
1121   pd.pool = pool;
1122   pd.repo = repo;
1123   pd.data = data;
1124 
1125   pd.kind = 0;
1126   pd.language = language && *language && strcmp(language, "en") != 0 ? language : 0;
1127   queue_init(&pd.diskusageq);
1128 
1129   init_cshash(&pd);
1130   if ((flags & REPO_EXTEND_SOLVABLES) != 0)
1131     {
1132       /* setup join data */
1133       pd.cshash_filled = 1;
1134       fill_cshash_from_repo(&pd);
1135     }
1136 
1137   solv_xmlparser_init(&pd.xmlp, stateswitches, &pd, startElement, endElement);
1138   if (solv_xmlparser_parse(&pd.xmlp, fp) != SOLV_XMLPARSER_OK)
1139     pd.ret = pool_error(pool, -1, "repo_rpmmd: %s at line %u:%u", pd.xmlp.errstr, pd.xmlp.line, pd.xmlp.column);
1140   solv_xmlparser_free(&pd.xmlp);
1141 
1142   solv_free(pd.lastdirstr);
1143   join_freemem(&pd.jd);
1144   free_cshash(&pd);
1145   repodata_free_dircache(data);
1146   queue_free(&pd.diskusageq);
1147 
1148   if ((flags & REPO_EXTEND_SOLVABLES) != 0)
1149     {
1150       /* is this a filelist extension? */
1151       if (repodata_has_keyname(data, SOLVABLE_FILELIST))
1152 	repodata_set_filelisttype(data, REPODATA_FILELIST_EXTENSION);
1153     }
1154   else
1155     {
1156       /* is this a primary with a filtered filelist? */
1157       if (data->end > data->start)
1158 	{
1159 	  repodata_set_filelisttype(data, REPODATA_FILELIST_FILTERED);
1160 	  repodata_set_void(data, SOLVID_META, REPOSITORY_FILTEREDFILELIST);
1161 	}
1162     }
1163 
1164   if (!(flags & REPO_NO_INTERNALIZE))
1165     repodata_internalize(data);
1166   POOL_DEBUG(SOLV_DEBUG_STATS, "repo_add_rpmmd took %d ms\n", solv_timems(now));
1167   POOL_DEBUG(SOLV_DEBUG_STATS, "repo size: %d solvables\n", repo->nsolvables);
1168   POOL_DEBUG(SOLV_DEBUG_STATS, "repo memory used: %d K incore, %d K idarray\n", repodata_memused(data)/1024, repo->idarraysize / (int)(1024/sizeof(Id)));
1169   return pd.ret;
1170 }
1171