/* * parse.cpp: A plugin for the Video Disk Recorder * * See the README file for copyright information and how to reach the author. * */ #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include "xmltv2vdr.h" #include "parse.h" #include "debug.h" // ------------------------------------------------------- time_t cParse::ConvertXMLTVTime2UnixTime(char *xmltvtime) { time_t offset=0; if (!xmltvtime) return (time_t) 0; char *withtz=strchr(xmltvtime,' '); int len; if (withtz) { len=strlen(xmltvtime)-(withtz-xmltvtime)-1; *withtz=':'; if ((withtz[1]=='+') || (withtz[1]=='-')) { if (len==5) { int val=atoi(&withtz[1]); int h=val/100; int m=val-(h*100); offset=h*3600+m*60; setenv("TZ",":UTC",1); } else { setenv("TZ",":UTC",1); } } else { if (len>2) { setenv("TZ",withtz,1); } else { setenv("TZ",":UTC",1); } } } else { withtz=&xmltvtime[strlen(xmltvtime)]; setenv("TZ",":UTC",1); } tzset(); len=withtz-xmltvtime; if (len<4) { unsetenv("TZ"); tzset(); return (time_t) 0; } len-=2; char fmt[]="%Y%m%d%H%M%S"; fmt[len]=0; struct tm tm; memset(&tm,0,sizeof(tm)); if (!strptime(xmltvtime,fmt,&tm)) { unsetenv("TZ"); tzset(); return (time_t) 0; } if (tm.tm_mday==0) tm.tm_mday=1; time_t ret=mktime(&tm); ret-=offset; unsetenv("TZ"); tzset(); return ret; } void cParse::RemoveNonAlphaNumeric(char *String) { if (!String) return; // remove " Teil " int len=strlen(String); char *p=strstr(String," Teil "); if (p) { memmove(p,p+6,len-6); } // remove non alphanumeric characters len=strlen(String); p=String; int pos=0; while (*p) { // 0x30 - 0x39 // 0x41 - 0x5A // 0x61 - 0x7A if ((*p<0x30) || (*p>0x7a) || (*p>0x39 && *p<0x41) || (*p>0x5A && *p< 0x61)) { memmove(p,p+1,len-pos); len--; continue; } p++; pos++; } // remove leading numbers len=strlen(String); p=String; while (*p) { // 0x30 - 0x39 if ((*p>=0x30) && (*p<=0x39)) { memmove(p,p+1,len); len--; continue; } else { break; } } return; } bool cParse::FetchSeasonEpisode(iconv_t cEP2ASCII, iconv_t cUTF2ASCII, const char *EPDir, const char *Title, const char *ShortText, int &Season, int &Episode) { // Title and ShortText are always UTF8 ! if (!EPDir) return false; if (!ShortText) return false; size_t slen=strlen(ShortText); if (!slen) return false; if (!Title) return false; if (cEP2ASCII==(iconv_t) -1) return false; if (cUTF2ASCII==(iconv_t) -1) return false; DIR *dir=opendir(EPDir); if (!dir) return false; struct dirent dirent_buf,*dirent; bool found=false; for (;;) { if (readdir_r(dir,&dirent_buf,&dirent)!=0) break; if (!dirent) break; if (dirent->d_name[0]=='.') continue; char *pt=strrchr(dirent->d_name,'.'); if (pt) *pt=0; if (!strncasecmp(dirent->d_name,Title,strlen(dirent->d_name))) { found=true; break; } } closedir(dir); if (!found) return false; char *epfile=NULL; if (asprintf(&epfile,"%s/%s.episodes",EPDir,dirent->d_name)==-1) return false; FILE *f=fopen(epfile,"r"); if (!f) { free(epfile); return false; } size_t dlen=4*slen; char *dshorttext=(char *) calloc(dlen,1); if (!dshorttext) { fclose(f); free(epfile); return false; } char *FromPtr=(char *) ShortText; char *ToPtr=(char *) dshorttext; if (iconv(cUTF2ASCII,&FromPtr,&slen,&ToPtr,&dlen)==(size_t) -1) { free(dshorttext); fclose(f); free(epfile); return false; } RemoveNonAlphaNumeric(dshorttext); if (!strlen(dshorttext)) { strcpy(dshorttext,ShortText); // ok lets try with the original text } char *line=NULL; size_t length; found=false; while (getline(&line,&length,f)!=-1) { if (line[0]=='#') continue; char epshorttext[256]=""; char depshorttext[1024]=""; if (sscanf(line,"%3d\t%3d\t%*3d\t%255c",&Season,&Episode,epshorttext)==3) { char *lf=strchr(epshorttext,'\n'); if (lf) *lf=0; slen=strlen(epshorttext); dlen=sizeof(depshorttext); FromPtr=(char *) epshorttext; ToPtr=(char *) depshorttext; if (iconv(cEP2ASCII,&FromPtr,&slen,&ToPtr,&dlen)!=(size_t) -1) { RemoveNonAlphaNumeric(depshorttext); if (!strlen(depshorttext)) { strcpy(depshorttext,epshorttext); // ok lets try with the original text } if (!strncasecmp(dshorttext,depshorttext,strlen(depshorttext))) { found=true; break; } } } } if (!found) { isyslog("failed to find '%s' for '%s' in eplists",ShortText,Title); } if (line) free(line); fclose(f); free(dshorttext); free(epfile); return found; } bool cParse::FetchEvent(xmlNodePtr enode) { char *slang=getenv("LANG"); xmlNodePtr node=enode->xmlChildrenNode; while (node) { if (node->type==XML_ELEMENT_NODE) { if ((!xmlStrcasecmp(node->name, (const xmlChar *) "title"))) { xmlChar *lang=xmlGetProp(node,(const xmlChar *) "lang"); xmlChar *content=xmlNodeListGetString(node->doc,node->xmlChildrenNode,1); if (content) { if (lang && slang && !xmlStrncasecmp(lang, (const xmlChar *) slang,2)) { xevent.SetTitle((const char *) content); } else { if (!xevent.HasTitle()) { xevent.SetTitle((const char *) content); } else { xevent.SetOrigTitle((const char *) content); } } xmlFree(content); } if (lang) xmlFree(lang); } else if ((!xmlStrcasecmp(node->name, (const xmlChar *) "sub-title"))) { // what to do with attribute lang? xmlChar *content=xmlNodeListGetString(node->doc,node->xmlChildrenNode,1); if (content) { xevent.SetShortText((const char *) content); xmlFree(content); } } else if ((!xmlStrcasecmp(node->name, (const xmlChar *) "desc"))) { // what to do with attribute lang? xmlChar *content=xmlNodeListGetString(node->doc,node->xmlChildrenNode,1); if (content) { xevent.SetDescription((const char *) content); xmlFree(content); } } else if ((!xmlStrcasecmp(node->name, (const xmlChar *) "credits"))) { xmlNodePtr vnode=node->xmlChildrenNode; while (vnode) { if (vnode->type==XML_ELEMENT_NODE) { if ((!xmlStrcasecmp(vnode->name, (const xmlChar *) "actor"))) { xmlChar *content=xmlNodeListGetString(vnode->doc,vnode->xmlChildrenNode,1); if (content) { xmlChar *arole=xmlGetProp(node,(const xmlChar *) "actor role"); xevent.AddCredits((const char *) vnode->name,(const char *) content,(const char *) arole); if (arole) xmlFree(arole); xmlFree(content); } } else { xmlChar *content=xmlNodeListGetString(vnode->doc,vnode->xmlChildrenNode,1); if (content) { xevent.AddCredits((const char *) vnode->name,(const char *) content); xmlFree(content); } } } vnode=vnode->next; } } else if ((!xmlStrcasecmp(node->name, (const xmlChar *) "date"))) { xmlChar *content=xmlNodeListGetString(node->doc,node->xmlChildrenNode,1); if (content) { xevent.SetYear(atoi((const char *) content)); xmlFree(content); } } else if ((!xmlStrcasecmp(node->name, (const xmlChar *) "category"))) { // what to do with attribute lang? xmlChar *content=xmlNodeListGetString(node->doc,node->xmlChildrenNode,1); if (content) { if (isdigit(content[0])) { xevent.SetEventID(atoi((const char *) content)); } else { xevent.AddCategory((const char *) content); } xmlFree(content); } } else if ((!xmlStrcasecmp(node->name, (const xmlChar *) "country"))) { xmlChar *content=xmlNodeListGetString(node->doc,node->xmlChildrenNode,1); if (content) { xevent.SetCountry((const char *) content); xmlFree(content); } } else if ((!xmlStrcasecmp(node->name, (const xmlChar *) "video"))) { xmlNodePtr vnode=node->xmlChildrenNode; while (vnode) { if (vnode->type==XML_ELEMENT_NODE) { if ((!xmlStrcasecmp(vnode->name, (const xmlChar *) "colour"))) { xmlChar *content=xmlNodeListGetString(vnode->doc,vnode->xmlChildrenNode,1); if (content) { xevent.AddVideo("colour",(const char *) content); xmlFree(content); } } if ((!xmlStrcasecmp(vnode->name, (const xmlChar *) "aspect"))) { xmlChar *content=xmlNodeListGetString(vnode->doc,vnode->xmlChildrenNode,1); if (content) { xevent.AddVideo("aspect",(const char *) content); xmlFree(content); } } if ((!xmlStrcasecmp(vnode->name, (const xmlChar *) "quality"))) { xmlChar *content=xmlNodeListGetString(vnode->doc,vnode->xmlChildrenNode,1); if (content) { xevent.AddVideo("quality",(const char *) content); xmlFree(content); } } } vnode=vnode->next; } } else if ((!xmlStrcasecmp(node->name, (const xmlChar *) "audio"))) { xmlNodePtr vnode=node->xmlChildrenNode; while (vnode) { if (vnode->type==XML_ELEMENT_NODE) { if ((!xmlStrcasecmp(vnode->name, (const xmlChar *) "stereo"))) { xmlChar *content=xmlNodeListGetString(vnode->doc,vnode->xmlChildrenNode,1); if (content) { content=(xmlChar*)strreplace((char *)content," ",""); xevent.SetAudio((const char *) content); xmlFree(content); } } } vnode=vnode->next; } } else if ((!xmlStrcasecmp(node->name, (const xmlChar *) "rating"))) { xmlChar *system=xmlGetProp(node,(const xmlChar *) "system"); if (system) { xmlNodePtr vnode=node->xmlChildrenNode; while (vnode) { if (vnode->type==XML_ELEMENT_NODE) { if ((!xmlStrcasecmp(vnode->name, (const xmlChar *) "value"))) { xmlChar *content=xmlNodeListGetString(vnode->doc,vnode->xmlChildrenNode,1); if (content) { xevent.AddRating((const char *) system,(const char *) content); xmlFree(content); } } } vnode=vnode->next; } xmlFree(system); } } else if ((!xmlStrcasecmp(node->name, (const xmlChar *) "star-rating"))) { xmlChar *system=xmlGetProp(node,(const xmlChar *) "system"); xmlNodePtr vnode=node->xmlChildrenNode; while (vnode) { if (vnode->type==XML_ELEMENT_NODE) { if ((!xmlStrcasecmp(vnode->name, (const xmlChar *) "value"))) { xmlChar *content=xmlNodeListGetString(vnode->doc,vnode->xmlChildrenNode,1); if (content) { xevent.AddStarRating((const char *) system,(const char *) content); xmlFree(content); } } } vnode=vnode->next; } if (system) xmlFree(system); } else if ((!xmlStrcasecmp(node->name, (const xmlChar *) "review"))) { xmlChar *type=xmlGetProp(node,(const xmlChar *) "type"); if (type && !xmlStrcasecmp(type, (const xmlChar *) "text")) { xmlChar *content=xmlNodeListGetString(node->doc,node->xmlChildrenNode,1); if (content) { xevent.AddReview((const char *) content); xmlFree(content); } xmlFree(type); } } else if ((!xmlStrcasecmp(node->name, (const xmlChar *) "icon"))) { xmlChar *src=xmlGetProp(node,(const xmlChar *) "src"); if (src) { const xmlChar *f=xmlStrstr(src,(const xmlChar *) "://"); if (f) { // url: skip scheme and scheme-specific-part f+=3; } else { // just try it f=src; } struct stat statbuf; if (stat((const char *) f,&statbuf)!=-1) xevent.SetPicExists(); xmlFree(src); } } else if ((!xmlStrcasecmp(node->name, (const xmlChar *) "length"))) { // length without advertisements -> just ignore } else if ((!xmlStrcasecmp(node->name, (const xmlChar *) "episode-num"))) { // episode-num in not usable format -> just ignore } else if ((!xmlStrcasecmp(node->name, (const xmlChar *) "subtitles"))) { // info about subtitles -> just ignore (till now) } else { esyslogs(source,"unknown element %s, please report!",node->name); } } node=node->next; } int season,episode; if (FetchSeasonEpisode(cep2ascii,cutf2ascii,epdir,xevent.Title(),xevent.ShortText(),season,episode)) { xevent.SetSeason(season); xevent.SetEpisode(episode); } return xevent.HasTitle(); } int cParse::Process(cEPGExecutor &myExecutor,char *buffer, int bufsize) { if (!buffer) return 134; if (!bufsize) return 134; cSchedulesLock *schedulesLock=NULL; const cSchedules *schedules=NULL; int l=0; while (l<300) { if (schedulesLock) delete schedulesLock; schedulesLock = new cSchedulesLock(true,200); // wait up to 60 secs for lock! schedules = cSchedules::Schedules(*schedulesLock); if (!myExecutor.StillRunning()) { delete schedulesLock; isyslogs(source,"request to stop from vdr"); return 0; } if (schedules) break; l++; } dsyslogs(source,"parsing output"); xmlDocPtr xmltv; xmltv=xmlReadMemory(buffer,bufsize,NULL,NULL,0); if (!xmltv) { esyslogs(source,"failed to parse xmltv"); delete schedulesLock; return 141; } xmlNodePtr rootnode=xmlDocGetRootElement(xmltv); if (!rootnode) { esyslogs(source,"no rootnode in xmltv"); xmlFreeDoc(xmltv); delete schedulesLock; return 141; } sqlite3 *db=NULL; if (sqlite3_open(epgfile,&db)!=SQLITE_OK) { esyslogs(source,"failed to open or create %s",epgfile); xmlFreeDoc(xmltv); delete schedulesLock; return 141; } char sql[]="CREATE TABLE IF NOT EXISTS epg (" \ "src nvarchar(100), channelid nvarchar(255), eventid int, eiteventid int, "\ "starttime datetime, duration int, title nvarchar(255),origtitle nvarchar(255), "\ "shorttext nvarchar(255), description text, eitdescription text, " \ "country nvarchar(255), year int, " \ "credits text, category text, review text, rating text, " \ "starrating text, video text, audio text, season int, episode int, picexists int," \ "srcidx int," \ "PRIMARY KEY(src, channelid, eventid)" \ ");" \ "CREATE UNIQUE INDEX IF NOT EXISTS idx1 on epg (eventid, src); " \ "CREATE UNIQUE INDEX IF NOT EXISTS idx2 on epg (eventid, channelid); " \ "CREATE UNIQUE INDEX IF NOT EXISTS idx3 on epg (eventid, channelid, src); " \ "CREATE INDEX IF NOT EXISTS idx4 on epg (starttime, title, channelid); " \ "CREATE INDEX IF NOT EXISTS idx5 on epg (starttime, src); " \ "BEGIN"; char *errmsg; if (sqlite3_exec(db,sql,NULL,NULL,&errmsg)!=SQLITE_OK) { esyslogs(source,"createdb: %s",errmsg); sqlite3_free(errmsg); sqlite3_close(db); xmlFreeDoc(xmltv); delete schedulesLock; return 141; } time_t begin=time(NULL)-7200; xmlNodePtr node=rootnode->xmlChildrenNode; int lerr=0; int cnt=0; while (node) { if (node->type!=XML_ELEMENT_NODE) { node=node->next; continue; } if ((xmlStrcasecmp(node->name, (const xmlChar *) "programme"))) { node=node->next; continue; } xmlChar *channelid=xmlGetProp(node,(const xmlChar *) "channel"); if (!channelid) { if (lerr!=PARSE_NOCHANNELID) esyslogs(source,"missing channelid in xmltv file"); lerr=PARSE_NOCHANNELID; node=node->next; continue; } cEPGMapping *map=maps->GetMap((const char *) channelid); if (!map) { if (lerr!=PARSE_NOMAPPING) esyslogs(source,"no mapping for channelid %s",channelid); lerr=PARSE_NOMAPPING; xmlFree(channelid); node=node->next; continue; } xmlFree(channelid); xmlChar *start,*stop; time_t starttime=(time_t) 0; time_t stoptime=(time_t) 0; start=xmlGetProp(node,(const xmlChar *) "start"); if (start) { starttime=ConvertXMLTVTime2UnixTime((char *) start); if (starttime) { stop=xmlGetProp(node,(const xmlChar *) "stop"); if (stop) { stoptime=ConvertXMLTVTime2UnixTime((char *) stop); xmlFree(stop); } } xmlFree(start); } if (!starttime) { if (lerr!=PARSE_XMLTVERR) esyslogs(source,"no starttime, check xmltv file"); lerr=PARSE_XMLTVERR; node=node->next; continue; } if (starttimenext; continue; } xevent.Clear(); xevent.SetStartTime(starttime); if (stoptime) xevent.SetDuration(stoptime-starttime); if (!FetchEvent(node)) // sets xevent { tsyslogs(source,"failed to fetch event"); node=node->next; continue; } for (int i=0; iNumChannelIDs(); i++) { const char *sql=xevent.GetSQL(source->Name(),source->Index(),map->ChannelIDs()[i].ToString()); if (sqlite3_exec(db,sql,NULL,NULL,&errmsg)!=SQLITE_OK) { tsyslogs(source,"sqlite3: %s",errmsg); sqlite3_free(errmsg); break; } } cnt++; node=node->next; if (!myExecutor.StillRunning()) { isyslogs(source,"request to stop from vdr"); break; } } dsyslogs(source,"processed %i xmltv events",cnt); if (sqlite3_exec(db,"COMMIT; ANALYZE epg;",NULL,NULL,&errmsg)!=SQLITE_OK) { esyslogs(source,"sqlite3: %s",errmsg); sqlite3_free(errmsg); } sqlite3_close(db); xmlFreeDoc(xmltv); delete schedulesLock; return 0; } void cParse::InitLibXML() { xmlInitParser(); } void cParse::CleanupLibXML() { xmlCleanupParser(); } cParse::cParse(const char *EPGFile, const char *EPDir, cEPGSource *Source, cEPGMappings *Maps) { source=Source; maps=Maps; epgfile=EPGFile; if (EPDir) { epdir=strdup(EPDir); if (!epdir) return; char *charset=strchr((char *) epdir,','); if (charset) { *charset=0; } else { charset=(char *) "UTF-8"; } cep2ascii=iconv_open(charset,"US-ASCII//TRANSLIT"); cutf2ascii=iconv_open("UTF-8","US-ASCII//TRANSLIT"); } else { epdir=NULL; } } cParse::~cParse() { if (epdir) { free((void *) epdir); iconv_close(cep2ascii); iconv_close(cutf2ascii); } }