Nuevo--Cinefilo(ES)-Mangafilms(ES)-Terra cine(ES)-ZonaDVD(ES

If you made a script you can offer it to the others here, or ask help to improve it. You can also report here bugs & problems with existing scripts.
Post Reply
legrad
Posts: 109
Joined: 2006-02-11 09:46:06
Location: Lerida-Spain

Nuevo--Cinefilo(ES)-Mangafilms(ES)-Terra cine(ES)-ZonaDVD(ES

Post by legrad »

Para los que pueda interesar aqui posteo estos script,hay una brve descripcion en los mismos

Code: Select all

(***************************************************

Ant Movie Catalog importation script
www.antp.be/software/moviecatalog/

[Infos]
Authors=Legrad
Title=cinefilo
Description=Detalles de cine, con cartel de calidad
Site=www.cinefilo.es
Language=ES
Version=1.0
Requires=3.5.0
Comments=
License=
GetInfo=1

[Options]

***************************************************)

 program Cinefilo;




var
  MovieName: string;
  MovieURL: string;
//------------------------------------------------------------------------------------
function BorraComillas(var S: string): string;
var
   n,len, tag: Integer;
   c: char;
   t: String;
begin
   tag := 0;
   t := '';
   len := length(s);
   for n :=1 to len do
   begin
     c := Copy(s,n,1);
     if c = '''' then
        c := ' ';
        t := t + c;
   end
   s := t;
   result := t;
end;
//---------------------------------------------------------------------
function Acentos(str1: string) :string;
begin
          str1  := AnsiLowerCase(str1);
          str1  := AnsiUpFirstLetter(str1);
          str1 := StringReplace(str1, 'ã¡' , 'á');
          str1 := StringReplace(str1, 'ã©' , 'é');
          str1 := StringReplace(str1, 'ã­', 'í');
          str1 := StringReplace(str1, 'iã³' , 'á');
          str1 := StringReplace(str1, 'Ã￾' , 'á');
          Str1 := StringReplace(Str1, 'ã±', 'ñ');
          Str1 := StringReplace(Str1, 'ã³', 'ó');
          Str1 := StringReplace(Str1, 'ãª', 'é');
          Str1 := StringReplace(Str1, 'ã', 'á');
          Str1 := StringReplace(Str1, 'Â', '');
          Str1 := StringReplace(Str1, '(cine) - cinefilo.es: cartelera de estrenos', '');
          Str1 := StringReplace(Str1, '...', '');
          Str1 := StringReplace(Str1, '(cine) - cinefilo.es: cartelera de', '');
          Str1 := StringReplace(Str1, '(cine) - cinefilo.es: cartelera', '');
          Str1 := StringReplace(Str1, '’', '');
result := str1;
end;

//------------------------------------------------------------------
                              function FindLine(Pattern: string; List: TStringList; StartAt: Integer): Integer;
var
  i: Integer;
begin
  Result := -1;
  if StartAt < 0 then
    StartAt := 0;
  for i := StartAt to List.Count-1 do
    if Pos(Pattern, List.GetString(i)) <> 0 then
    begin
      Result := i;
      Break;
    end;
end;
//------------------------------------------------------------------------------------
                      function TextBetween(var S: string; StartTag: string; EndTag: string): string;
var
  InitialPos: Integer;
begin
  InitialPos := Pos(StartTag, S);
  if InitialPos = 0 then
    result := ''
  else
  begin
    Delete(S, 1, InitialPos + Length(StartTag) - 1);
    InitialPos := Pos(EndTag, S);
    if InitialPos = 0 then
      result := S
    else
    begin
      result := copy(S, 1, InitialPos - 1);
      Delete(S, 1, InitialPos + 1);
    end;
  end;
end;

//------------------------------------------------------------------------------------
                               function DeleteTags(var S: string): string;
var
   n,len, tag: Integer;
   c: char;
   t: String;
begin

   tag := 0;
   t := '';
   len := length(s);

   for n :=1 to len do
   begin
      c := Copy(s,n,1);


      if c = #9 then
         c := ' ';

      if(tag=1) then
      begin
         if(c='>') then tag := 0;
         continue;
      end
      else
      begin
         if(c='<') then
         begin
            tag := 1;
            continue;
         end;
         t := t + c;
      end;
   end
   s := t;
   result := t;
end;


//------------------------------------------------------------------------------------
procedure AnalyzePage(Address: string);
var
  strPage, MovieAddr, MovieTitle, MovieDate, MovieID, Movie: string;
  BeginPos, EndPos: Integer;
  BeginPoss, EndPoss: Integer;
begin
  strPage := GetPage(Address);
  BeginPos := Pos('en el dominio <b>www.cinefilo.es', strPage);
  if(BeginPos > -1)then
    begin
      PickTreeClear;
      Delete(strPage, 1, BeginPos);
      BeginPos := Pos('href="http://www.cinefilo.es/cine-', strPage);
      EndPos := 1;
      while ((BeginPos > 0) and (EndPos > 0)) do

        begin
          Delete(strPage, 1, BeginPos);
          EndPos := Pos('" class', strPage);
          MovieId := Copy(strPage,+34, EndPos-34);
          MovieAddr := 'http://www.cinefilo.es/cine-' + MovieId;
          BeginPoss := Pos(')"',strPage);
          EndPoss := Pos('</h2>', strPage);
          MovieTitle := Copy(strPage,BeginPoss, EndPoss);
          MovieTitle := TextBetween (MovieTitle, '>', '</a>');
          DeleteTags(MovieTitle);
          MovieTitle := Acentos(MovieTitle);
          PickTreeAdd(MovieTitle, MovieAddr);
          BeginPos := Pos('href="http://www.cinefilo.es/cine-', strPage);
          if(Pos('</body>', strPage) < BeginPos) then
           BeginPos := -1;
        end;

    end;
    PickTreeExec(Address)
    AnalyzeMoviePage(Address);
end;
//------------------------------------------------------------------------------------
procedure AnalyzeMoviePage(Address: string);
var
  Page: TStringList;
  LineNr: Integer;
  Line: string;
  Item: string;
  Comments: string;
  Actors: string;
  Directors: string;
  Description: string;


begin
  Description := '';

  // URL
  SetField(fieldURL, Address);

  Page := TStringList.Create;
  Page.Text := GetPage(Address);

  // Titulo traducido
  LineNr := FindLine('  <b>', Page, 0);
  Line := Page.GetString(LineNr);
  Item := TextBetween (Line, '  <b>', '</b>');
  Item  := AnsiLowerCase(Item);
  Item  := AnsiUpFirstLetter(Item );
  HTMLDecode(Item);
  SetField(fieldTranslatedTitle, Trim (Item));

  // Titulo Original
  LineNr := FindLine('en IMDb', Page, 0);
  if LineNr <> -1 then
  begin
    Line := Page.GetString(LineNr);
    Item := TextBetween (Line, '><b>', '</b>');
    DeleteTags (Item);
    Item  := AnsiLowerCase(Item);
    Item  := AnsiUpFirstLetter(Item );
    HTMLDecode(Item);
    SetField(fieldOriginalTitle, Trim (Item));
  end;
  // Año
  LineNr := FindLine('en IMDb', Page, 0);
  if LineNr <> -1 then
  begin
    Line := Page.GetString(LineNr);
    Item := TextBetween (Line, '(', ')');
    DeleteTags (Item);
    Item  := AnsiLowerCase(Item);
    Item   := AnsiUpFirstLetter(Item );
    HTMLDecode(Item);
    SetField(fieldYear, Trim (Item));
  end;
   // Director
  LineNr := FindLine('en IMDb', Page, 0);
  if LineNr <> -1 then
  begin
    Line := Page.GetString(LineNr);
    Item := TextBetween (Line, 'busqueda.php?busqueda=', 'title');
    Item := BorraComillas(Item);
    DeleteTags (Item);
    Item   := AnsiUpFirstLetter(Item );
    HTMLDecode(Item);
    SetField(fieldDirector, Trim (Item));
  end;
  // Nacionalidad
  LineNr := FindLine('Nacionalidad: <font color=', Page, 0);
  if LineNr <> -1 then
  begin
    Line := Page.GetString(LineNr);
    Item := TextBetween (Line, '#9A9A9A', '</font>');
    Item := BorraComillas(Item);
    DeleteTags (Item);
    Item  := StringReplace(Item , '>', '');
    HTMLDecode(Item);
    SetField(fieldCountry, Trim (Item));
  end;
  // Duracion
  LineNr := FindLine('color / ', Page, 0);
  if LineNr <> -1 then
  begin
    Line := Page.GetString(LineNr);
    Item := TextBetween (Line, 'color / ', 'minutos');
    DeleteTags (Item);
    HTMLDecode(Item);
    SetField(fieldLength, Trim (Item));
  end;

// Categoria
  LineNr := FindLine(' minutos / <font color=', Page, 0);
  if LineNr <> -1 then
  begin
    Line := Page.GetString(LineNr);
    Item := TextBetween (Line, ' minutos / <font color=', '</font><br>');
    Item := BorraComillas(Item);
    Item  := StringReplace(Item , '>', '');
    Item  := StringReplace(Item , '#9A9A9A', '');
    DeleteTags (Item);
    Item   := AnsiUpFirstLetter(Item );
    HTMLDecode(Item);
    SetField(fieldCategory, Trim (Item));
  end;
  
  // Reparto
  LineNr := FindLine(' minutos / <font color=', Page, 0);
  if LineNr <> -1 then
  begin
    Line := Page.GetString(LineNr);
    Item := TextBetween (Line, '</font><br></span><br />', '<br><br><span class=');
    DeleteTags (Item);
    Item   := AnsiUpFirstLetter(Item );
    HTMLDecode(Item);
    SetField(fieldActors, Trim (Item));
  end;
  // productor
  LineNr := FindLine('Produce:</font>', Page, 0);
  if LineNr <> -1 then
  begin
    Line := Page.GetString(LineNr);
    Item := TextBetween (Line, 'Produce:</font>', '</span></td>');
    DeleteTags (Item);
    Item   := AnsiUpFirstLetter(Item );
    HTMLDecode(Item);
    SetField(fieldProducer, Trim (Item));
  end;
  
  // sinopsis
 LineNr := FindLine('Sinopsis</td></tr><tr>', Page, 0);
  if LineNr <> -1 then
  begin
    Line := Page.GetString(LineNr);
    Item := TextBetween (Line, '#000000', '</table>');
    DeleteTags (Item);
    Item := BorraComillas(Item);
    Item  := StringReplace(Item , '>', '');
    Item   := AnsiUpFirstLetter(Item );
    HTMLDecode(Item);
    SetField(fieldDescription, Trim (Item));
  end;
// Caratula
  LineNr := FindLine('html][img]http://www.index-dvd.com/covers/300/', Page, 0);
  if LineNr <> -1 then
  begin
     Line := Page.GetString(LineNr);
     Item := TextBetween (Line, 'html][img]http://www.index-dvd.com/covers/300/', '[/img][/url]');
     Item:= BorraComillas(Item);
     Item  := StringReplace(Item , '300a', '600a');
     GetPicture ('http://www.index-dvd.com/covers/600/'+Item);
  end;
end;
 //-------------------------------------------------------------------------
begin
       if (CheckVersion(3,5,0)=FALSe) then
   begin
      ShowMessage('Se requiere Ant Movie Catalog versión 3.5 o superior');
      exit;
   end;

   MovieName := GetField(fieldTranslatedTitle);
   if MovieName = '' then
            MovieName := GetField(fieldOriginalTitle);
Input('Cinefilo', 'Buscar:', MovieName);

     if(GetOption('Sin resultado') = 0) then  Input('Cinefilo', 'Buscar:', MovieName);

   AnalyzePage('http://www.google.es/search?num=100&hl=es&as_qdr=all&q=%22' + UrlEncode(MovieName)+'%22+site%3Awww.cinefilo.es&btnG=B%C3%BAsqueda&meta=');
end.


Code: Select all

(***************************************************

Ant Movie Catalog importation script
www.antp.be/software/moviecatalog/

[Infos]
Authors=Legrad
Title=MangaFilms
Description=La mayoria de los films son relativoa a esta distribuidora
Site=
Language=es
Version=1.0
Requires=3.5.0
Comments=
License=
GetInfo=1

[Options]

***************************************************)

 program MangaFilms;




var
  MovieName: string;
  MovieURL: string;
//------------------------------------------------------------------------------------
function BorraComillas(var S: string): string;
var
   n,len, tag: Integer;
   c: char;
   t: String;
begin
   tag := 0;
   t := '';
   len := length(s);
   for n :=1 to len do
   begin
     c := Copy(s,n,1);
     if c = '''' then
        c := ' ';
        t := t + c;
   end
   s := t;
   result := t;
end;
//---------------------------------------------------------------------

function Acentos(str1: string) :string;
begin
          str1  := AnsiLowerCase(str1);
          str1  := AnsiUpFirstLetter(str1);
          str1 := StringReplace(str1, 'ã¡' , 'á');
          str1 := StringReplace(str1, 'ã©' , 'é');
          str1 := StringReplace(str1, 'ã­', 'í');
          str1 := StringReplace(str1, 'iã³' , 'á');
          str1 := StringReplace(str1, 'Ã￾' , 'á');
          Str1 := StringReplace(Str1, 'ã±', 'ñ');
          Str1 := StringReplace(Str1, 'ã³', 'ó');
          Str1 := StringReplace(Str1, 'ãª', 'é');
          Str1 := StringReplace(Str1, 'ã', 'á');
          Str1 := StringReplace(Str1, 'Â', '');
          Str1 := StringReplace(Str1, '’', '');
result := str1;
end;

//------------------------------------------------------------------
                              function FindLine(Pattern: string; List: TStringList; StartAt: Integer): Integer;
var
  i: Integer;
begin
  Result := -1;
  if StartAt < 0 then
    StartAt := 0;
  for i := StartAt to List.Count-1 do
    if Pos(Pattern, List.GetString(i)) <> 0 then
    begin
      Result := i;
      Break;
    end;
end;
//------------------------------------------------------------------------------------
                      function TextBetween(var S: string; StartTag: string; EndTag: string): string;
var
  InitialPos: Integer;
begin
  InitialPos := Pos(StartTag, S);
  if InitialPos = 0 then
    result := ''
  else
  begin
    Delete(S, 1, InitialPos + Length(StartTag) - 1);
    InitialPos := Pos(EndTag, S);
    if InitialPos = 0 then
      result := S
    else
    begin
      result := copy(S, 1, InitialPos - 1);
      Delete(S, 1, InitialPos + 1);
    end;
  end;
end;

//------------------------------------------------------------------------------------
                               function DeleteTags(var S: string): string;
var
   n,len, tag: Integer;
   c: char;
   t: String;
begin

   tag := 0;
   t := '';
   len := length(s);

   for n :=1 to len do
   begin
      c := Copy(s,n,1);


      if c = #9 then
         c := ' ';

      if(tag=1) then
      begin
         if(c='>') then tag := 0;
         continue;
      end
      else
      begin
         if(c='<') then
         begin
            tag := 1;
            continue;
         end;
         t := t + c;
      end;
   end
   s := t;
   result := t;
end;


//------------------------------------------------------------------------------------
procedure AnalyzePage(Address: string);
var
  strPage, MovieAddr, MovieTitle, MovieDate, MovieID, Movie: string;
  BeginPos, EndPos: Integer;
  BeginPoss, EndPoss: Integer;
begin
  strPage := GetPage(Address);
  BeginPos := Pos('en el dominio <b>www.mangafilms.es', strPage);
  if(BeginPos > -1)then
    begin
      PickTreeClear;
      Delete(strPage, 1, BeginPos);
      BeginPos := Pos('href="http://www.mangafilms.es/ficha.php?id=', strPage);
      EndPos := 1;
      while ((BeginPos > 0) and (EndPos > 0)) do

        begin
          Delete(strPage, 1, BeginPos);
          EndPos := Pos('" class', strPage);
          MovieId := Copy(strPage,+44, EndPos-44);
          MovieAddr := 'http://www.mangafilms.es/ficha.php?id=' + MovieId;
          BeginPoss := Pos(')">',strPage);
          EndPoss := Pos('</h2>', strPage);
          MovieTitle := Copy(strPage,BeginPoss, EndPoss);
          MovieTitle := TextBetween (MovieTitle, '|', '</a>');
          DeleteTags(MovieTitle);
          MovieTitle := Acentos(MovieTitle);
          PickTreeAdd(MovieTitle, MovieAddr);
          BeginPos := Pos('href="http://www.mangafilms.es/ficha.php?id=', strPage);
          if(Pos('</body>', strPage) < BeginPos) then
           BeginPos := -1;
        end;

    end;
    PickTreeExec(Address)
    AnalyzeMoviePage(Address);
end;
//------------------------------------------------------------------------------------
procedure AnalyzeMoviePage(Address: string);
var
  Page: TStringList;
  LineNr: Integer;
  Line: string;
  Item: string;
  Comments: string;
  Actors: string;
  Directors: string;
  Description: string;


begin
  Description := '';

  // URL
  SetField(fieldURL, Address);
  Page := TStringList.Create;
  Page.Text := GetPage(Address);

  // Titulo original
  LineNr := FindLine('Título original</td>', Page, 0);
  if LineNr > 0 then
  begin
    Item := copy(Page.Text, pos('Título original</td>',Page.Text), length(Page.Text));
    Item := TextBetween (Item, '<td width="76%">', '</td>');
    Item := StringReplace(Item , #13#10, '');
    Item  := StringReplace(Item , '   ', '');
    DeleteTags (Item);
    Item   := AnsiUpFirstLetter(Item );
    Item  := Trim(Item );
    HTMLDecode(Item);
  SetField(fieldOriginalTitle, Trim (Item));
end;
  // Titulo traducido
  LineNr := FindLine('<title>', Page, 0);
  if LineNr <> -1 then
  begin
    Line := Page.GetString(LineNr);
    Item := TextBetween (Line, '|', '</title>');
    DeleteTags (Item);
    Item  := AnsiLowerCase(Item);
    Item  := AnsiUpFirstLetter(Item );
    HTMLDecode(Item);
    SetField(fieldTranslatedTitle, Trim (Item));
  end;
 // Nacionalidad
  LineNr := FindLine('>Nacionalidad</td>', Page, 0);
  if LineNr > 0 then
  begin
    Item := copy(Page.Text, pos('>Nacionalidad</td>',Page.Text), length(Page.Text));
    Item := TextBetween (Item, '<td width="76%">', '</td>');
    Item := StringReplace(Item , #13#10, '');
    Item  := StringReplace(Item , '   ', '');
    DeleteTags (Item);
    Item   := AnsiUpFirstLetter(Item );
    Item  := Trim(Item );
    HTMLDecode(Item);
  SetField(fieldCountry, Trim (Item));
end;
   // Director
  LineNr := FindLine('>Dirigida por</td>', Page, 0);
  if LineNr > 0 then
  begin
    Item := copy(Page.Text, pos('>Dirigida por</td>',Page.Text), length(Page.Text));
    Item := TextBetween (Item, 'php?b=', '>');
    Item := StringReplace(Item , #13#10, '');
    Item  := StringReplace(Item , '   ', '');
    Item  := StringReplace(Item , '%20', ' ');
    DeleteTags (Item);
    Item   := AnsiUpFirstLetter(Item );
    Item  := Trim(Item );
    HTMLDecode(Item);
    SetField(fieldDirector, Trim (Item));
  end;
  // pais
  LineNr := FindLine('Nacionalidad: <font color=', Page, 0);
  if LineNr <> -1 then
  begin
    Line := Page.GetString(LineNr);
    Item := TextBetween (Line, '#9A9A9A', '</font>');
    Item := BorraComillas(Item);
    DeleteTags (Item);
    Item  := StringReplace(Item , '>', '');
    HTMLDecode(Item);
    SetField(fieldCountry, Trim (Item));
  end;
  // duracion
  LineNr := FindLine('>Duración</td>', Page, 0);
  if LineNr > 0 then
  begin
    Item := copy(Page.Text, pos('>Duración</td>',Page.Text), length(Page.Text));
    Item := TextBetween (Item, '<td width="76%">', 'min');
    Item := StringReplace(Item , #13#10, '');
    Item  := StringReplace(Item , '   ', '');
    DeleteTags (Item);
    Item   := AnsiUpFirstLetter(Item );
    Item  := Trim(Item );
    HTMLDecode(Item);
    SetField(fieldLength, Trim (Item));
  end;

  //Año
  LineNr := FindLine('>Año producción</td>', Page, 0);
  if LineNr > 0 then
  begin
    Item := copy(Page.Text, pos('>Año producción</td>',Page.Text), length(Page.Text));
    Item := TextBetween (Item, '<td width="76%">', '</td>');
    Item := StringReplace(Item , #13#10, '');
    Item  := StringReplace(Item , '   ', '');
    DeleteTags (Item);
    Item   := AnsiUpFirstLetter(Item );
    Item  := Trim(Item );
    HTMLDecode(Item);
    SetField(fieldYear, Trim (Item));
  end;
// Categoria
  LineNr := FindLine('td width="24%">Género</td>', Page, 0);
  if LineNr > 0 then
  begin
    Item := copy(Page.Text, pos('td width="24%">Género</td>',Page.Text), length(Page.Text));
    Item := TextBetween (Item, '<td width="76%">', '</td>');
    Item := StringReplace(Item , #13#10, '');
    Item  := StringReplace(Item , '   ', '');
    DeleteTags (Item);
    Item   := AnsiUpFirstLetter(Item );
    Item  := Trim(Item );
    HTMLDecode(Item);
    SetField(fieldCategory, Trim (Item));
  end;
  
  // Reparto
  LineNr := FindLine('Intérpretes</td>', Page, 0);
  if LineNr > 0 then
  begin
    Item := copy(Page.Text, pos('Intérpretes</td>',Page.Text), length(Page.Text));
    Item := TextBetween (Item, '<td width="76%">', '</tr>');
    Item := StringReplace(Item , #13#10, '');
    Item  := StringReplace(Item , '</a><br>','*');
    Item  := StringReplace(Item , '* ',#13#10);
    DeleteTags (Item);
    SetField(fieldActors, Trim (Item));
  end;
  
  // sinopsis
 LineNr := FindLine('Sinopsis</span></td>', Page, 0);
  if LineNr > 0 then
  begin
    Item := copy(Page.Text, pos('Sinopsis</span></td>',Page.Text), length(Page.Text));
    Item := TextBetween (Item, '<td class="txt">', '<br></td>');
    Item  := StringReplace(Item , '>', '');
    Item := StringReplace(Item ,#13#10, '');
    DeleteTags (Item);
    Item   := AnsiUpFirstLetter(Item);
    SetField(fieldDescription,Trim(Item));
  end;
// Caratula
  LineNr := FindLine('align="center"><img src="rcs_caratula/', Page, 0);
  if LineNr <> -1 then
  begin
     Line := Page.GetString(LineNr);
     Item := TextBetween (Line, 'src="', '" width');
     GetPicture ('http://www.mangafilms.es/'+Item);
  end;
end;
 //-------------------------------------------------------------------------
begin
       if (CheckVersion(3,5,0)=FALSe) then
   begin
      ShowMessage('Se requiere Ant Movie Catalog versión 3.5 o superior');
      exit;
   end;

   MovieName := GetField(fieldTranslatedTitle);
   if MovieName = '' then
            MovieName := GetField(fieldOriginalTitle);
Input('MangaFilms', 'Buscar:', MovieName);

     if(GetOption('Sin resultado') = 0) then  Input('MangaFilms', 'Buscar:', MovieName);

   AnalyzePage('http://www.google.es/search?num=100&hl=es&as_qdr=all&q=%22' + UrlEncode(MovieName)+'%22+site%3Awww.mangafilms.es&btnG=B%C3%BAsqueda&meta=');
end.

Code: Select all

(***************************************************

Ant Movie Catalog importation script
www.antp.be/software/moviecatalog/

[Infos]
Authors=Legrad
Title=Terra cine
Description=La pagina no contiene dato nacionalidad, en algunas hay caratula en otras solo una fotograma del film
Site=www.terra.es/cine/
Language=ES
Version=1.0
Requires=3.5.0
Comments=
License=
GetInfo=1

[Options]

***************************************************)

 program Terra Cine;



var
  MovieName: string;
  MovieURL: string;
//------------------------------------------------------------------------------------
function BorraComillas(var S: string): string;
var
   n,len, tag: Integer;
   c: char;
   t: String;
begin
   tag := 0;
   t := '';
   len := length(s);
   for n :=1 to len do
   begin
     c := Copy(s,n,1);
     if c = '''' then
        c := ' ';
        t := t + c;
   end
   s := t;
   result := t;
end;
//---------------------------------------------------------------------
function Acentos(str1: string) :string;
begin
          str1  := AnsiLowerCase(str1);
          str1  := AnsiUpFirstLetter(str1);
          str1 := StringReplace(str1, 'ã¡' , 'á');
          str1 := StringReplace(str1, 'ã©' , 'é');
          str1 := StringReplace(str1, 'ã­', 'í');
          str1 := StringReplace(str1, 'iã³' , 'á');
          str1 := StringReplace(str1, 'Ã￾' , 'á');
          Str1 := StringReplace(Str1, 'ã±', 'ñ');
          Str1 := StringReplace(Str1, 'ã³', 'ó');
          Str1 := StringReplace(Str1, 'ãª', 'é');
           Str1 := StringReplace(Str1, 'ã', 'á');
            Str1 := StringReplace(Str1, 'Â', '');
result := str1;
end;

//------------------------------------------------------------------
                              function FindLine(Pattern: string; List: TStringList; StartAt: Integer): Integer;
var
  i: Integer;
begin
  Result := -1;
  if StartAt < 0 then
    StartAt := 0;
  for i := StartAt to List.Count-1 do
    if Pos(Pattern, List.GetString(i)) <> 0 then
    begin
      Result := i;
      Break;
    end;
end;
//------------------------------------------------------------------------------------
                      function TextBetween(var S: string; StartTag: string; EndTag: string): string;
var
  InitialPos: Integer;
begin
  InitialPos := Pos(StartTag, S);
  if InitialPos = 0 then
    result := ''
  else
  begin
    Delete(S, 1, InitialPos + Length(StartTag) - 1);
    InitialPos := Pos(EndTag, S);
    if InitialPos = 0 then
      result := S
    else
    begin
      result := copy(S, 1, InitialPos - 1);
      Delete(S, 1, InitialPos + 1);
    end;
  end;
end;

//------------------------------------------------------------------------------------
                               function DeleteTags(var S: string): string;
var
   n,len, tag: Integer;
   c: char;
   t: String;
begin

   tag := 0;
   t := '';
   len := length(s);

   for n :=1 to len do
   begin
      c := Copy(s,n,1);


      if c = #9 then
         c := ' ';

      if(tag=1) then
      begin
         if(c='>') then tag := 0;
         continue;
      end
      else
      begin
         if(c='<') then
         begin
            tag := 1;
            continue;
         end;
         t := t + c;
      end;
   end
   s := t;
   result := t;
end;


//------------------------------------------------------------------------------------
procedure AnalyzePage(Address: string);
var
  strPage, MovieAddr, MovieTitle, MovieDate, MovieID, Movie: string;
  BeginPos, EndPos: Integer;
  BeginPoss, EndPoss: Integer;
begin
  strPage := GetPage(Address);
  BeginPos := Pos('en el dominio <b>www.terra.es', strPage);
  if(BeginPos > -1)then
    begin
      PickTreeClear;
      Delete(strPage, 1, BeginPos);
      BeginPos := Pos('href="http://www.terra.es/cine/nuestra_filmoteca/pelicula.cfm?ID=', strPage);
      EndPos := 1;
      while ((BeginPos > 0) and (EndPos > 0)) do

        begin
          Delete(strPage, 1, BeginPos);
          EndPos := Pos('" clas', strPage);
          MovieId := Copy(strPage,+65, EndPos-65);
          MovieAddr := 'http://www.terra.es/cine/nuestra_filmoteca/pelicula.cfm?ID=' + MovieId;
          BeginPoss := Pos(')"',strPage);
          EndPoss := Pos('</h2>', strPage);
          MovieTitle := Copy(strPage,BeginPoss, EndPoss);
          DeleteTags(MovieTitle);
          MovieTitle := TextBetween (MovieTitle, '>', '</a>');
          MovieTitle := StringReplace(MovieTitle , '· Filmoteca · Cine · Terra', '');
          MovieTitle := Acentos(MovieTitle);
          PickTreeAdd(MovieTitle, MovieAddr);
          BeginPos := Pos('href="http://www.terra.es/cine/nuestra_filmoteca/pelicula.cfm?ID=', strPage);
          if(Pos('</body>', strPage) < BeginPos) then
           BeginPos := -1;
        end;

    end;
    PickTreeExec(Address)
    AnalyzeMoviePage(Address);
end;
//------------------------------------------------------------------------------------
procedure AnalyzeMoviePage(Address: string);
var
  Page: TStringList;
  LineNr: Integer;
  Line: string;
  Item: string;
  Comments: string;
  Actors: string;
  Directors: string;
  Description: string;


begin
  Description := '';

  // URL
  SetField(fieldURL, Address);

  Page := TStringList.Create;
  Page.Text := GetPage(Address);

  // Traducido
  LineNr := FindLine('<title>', Page, 0);
  Line := Page.GetString(LineNr);
  Item := TextBetween (Line, '<title>', '· Filmoteca');
  Item  := AnsiLowerCase(Item);
  Item   := AnsiUpFirstLetter(Item );
  HTMLDecode(Item);
  SetField(fieldTranslatedTitle, Trim (Item));

  // Original
  LineNr := FindLine('>Título original:', Page, 0);
  if LineNr <> -1 then
  begin
    Line := Page.GetString(LineNr);
    Item := TextBetween (Line, '   ', '</font></td></tr>');
    DeleteTags (Item);
    Item  := AnsiLowerCase(Item);
    Item   := AnsiUpFirstLetter(Item );
    HTMLDecode(Item);
    SetField(fieldOriginalTitle, Trim (Item));
  end;

// Categoria
  LineNr := FindLine('Género:<', Page, 0);
  if LineNr <> -1 then
  begin
    Line := Page.GetString(LineNr);
    Item := TextBetween (Line, '   ', '</font></td></tr>');
    DeleteTags (Item);
    Item  := AnsiLowerCase(Item);
    Item   := AnsiUpFirstLetter(Item );
    HTMLDecode(Item);
    SetField(fieldCategory, Trim (Item));
  end;
  // Año
  LineNr := FindLine('producción:', Page, 0);
  if LineNr <> -1 then
  begin
    Line := Page.GetString(LineNr);
    Item := TextBetween (Line, '   ', '</font></td></tr>');
    DeleteTags (Item);
    Item  := AnsiLowerCase(Item);
    Item   := AnsiUpFirstLetter(Item );
    HTMLDecode(Item);
    SetField(fieldYear, Trim (Item));
  end;
  
  // director
  LineNr := FindLine('<b>Dirección:</b>', Page, 0);
  if LineNr > 0 then
  begin
    Item := copy(Page.Text, pos('href="   ',Page.Text), length(Page.Text));
    Item := TextBetween (Item, '<font color="000000">', '</font></a>');
    Item := StringReplace(Item , #13#10, '');
    Item  := StringReplace(Item , '   ', '');
    DeleteTags (Item);
    Item   := AnsiUpFirstLetter(Item );
    Item  := Trim(Item );
    HTMLDecode(Item);
    SetField(fieldDirector, Trim (Item));
  end;
  
  // productor
  LineNr := FindLine('<b>Producción:</b>', Page, 0);
  if LineNr > 0 then
  begin
    Item := copy(Page.Text, pos('<b>Producción:</b>',Page.Text), length(Page.Text));
    Item := TextBetween (Item, '</font></td><td><font face="Verdana, Arial, Helvetica, sans-serif" size="1">', '</font></td></tr>');
    Item := StringReplace(Item , #13#10, ' ');
    Item  := StringReplace(Item , '   ', '');
    DeleteTags (Item);
    Item   := AnsiUpFirstLetter(Item );
    Item  := Trim(Item );
    Item  := StringReplace(Item , '                     ', '');
    SetField(fieldProducer, Trim (Item));
  end;
  
  // Duracion
  LineNr := FindLine('<b>Duraci', Page, 0);
  if LineNr <> -1 then
  begin
    Line := Page.GetString(LineNr);
    Item := TextBetween (Line, '   ', 'minutos');
    DeleteTags (Item);
    HTMLDecode(Item);
    SetField(fieldLength, Trim (Item));
  end;
  
  
  // Reparto
  LineNr := FindLine('color="CF05A2">', Page, 0);
  if LineNr > 0 then
  begin
    Item := copy(Page.Text, pos('color="CF05A2">',Page.Text), length(Page.Text));
    Item := TextBetween (Item, '<b>', '</table><BR>');
    Item := StringReplace(Item , #13#10, '');
    Item  := StringReplace(Item , '</b></font></td>', ' : ');
    Item  := StringReplace(Item , '</font></a></td></tr>', #13#10);
    Item  := StringReplace(Item , '   ', '');
    DeleteTags (Item);
    Item  := StringReplace(Item , '       ', '');
    Item  := StringReplace(Item , '      ', '');
    Item  := StringReplace(Item , ':', ' -:- ');
    Item   := AnsiUpFirstLetter(Item );
    SetField(fieldActors, Trim (Item));
  end;
  
  // sinopsis
  LineNr := FindLine('<img src="/cine/img/estrella_neg.gif"', Page, 0);
  if LineNr > 0 then
  begin
    Item := copy(Page.Text, pos('<img src="/cine/img/estrella_neg.gif"',Page.Text), length(Page.Text));
    Item := TextBetween (Item, 'color=ffffff>', '<table width="294"');
    Item := StringReplace(Item , #13#10, '');
    Item  := StringReplace(Item , '   ', '');
    DeleteTags (Item);
    Item   := AnsiUpFirstLetter(Item );
    Item  := Trim(Item );
    SetField(fieldDescription, Trim (Item));
  end;
 // Comentarios
  LineNr := FindLine('Guión:</b>', Page, 0);
  if LineNr > 0 then
  begin
    Item := copy(Page.Text, pos('Guión:</b>',Page.Text), length(Page.Text));
    Item := TextBetween (Item, 'size="1">', 'Idioma:');
    Item := StringReplace(Item , #13#10, '');
    Item  := StringReplace(Item , '</font></td></tr>', #13#10);
    Item := StringReplace(Item , '   ', '');
    Item := StringReplace(Item , 'Producción:', 'Producción:');
    Item := StringReplace(Item , 'Fotografía:', 'Fotografía:');
    Item := StringReplace(Item , 'Música:', 'Música:');
    DeleteTags (Item);
    Item   := AnsiUpFirstLetter(Item );
    Item := StringReplace(Item , 'Producción:      ', 'Producción: ');
    Item := StringReplace(Item , 'Fotografía:      ', 'Fotografía: ');
    Item := StringReplace(Item , 'Música:      ', 'Música: ');
    Item := StringReplace(Item , '      ', ' ');
    Item := StringReplace(Item , '   ', '');
    SetField(fieldComments, Trim ('Guión:'+Item));
  end;

// Picture
  LineNr := FindLine('href="javascript:abrir_imagen_directa', Page, 0);
  if LineNr <> -1 then
  begin
     Line := Page.GetString(LineNr);
     Item := TextBetween (Line, '/', ',');
     Item:= BorraComillas(Item);
     GetPicture ('http://www.terra.es/'+Item);
  end;
end;
 //-------------------------------------------------------------------------
begin
       if (CheckVersion(3,5,0)=FALSe) then
   begin
      ShowMessage('Se requiere Ant Movie Catalog versión 3.5 o superior');
      exit;
   end;

   MovieName := GetField(fieldTranslatedTitle);
   if MovieName = '' then
            MovieName := GetField(fieldOriginalTitle);
Input('Terra Cine', 'Buscar:', MovieName);

     if(GetOption('Sin resultado') = 0) then  Input('Terra Cine', 'Buscar:', MovieName);

   AnalyzePage('http://www.google.es/search?num=100&hl=es&as_qdr=all&q=%22' + UrlEncode(MovieName)+'%22+site%3Awww.terra.es%2Fcine%2Fnuestra_filmoteca%2F&btnG=B%C3%BAsqueda&meta=');
end.


Code: Select all

(***************************************************

Ant Movie Catalog importation script
www.antp.be/software/moviecatalog/

[Infos]
Authors=Legrad
Title=ZonaDVD
Description=Pagina con informacion de films, algunos raros, aleatoriamente algunos no contiene nacionalidad,duracion,categoria, la imagen es acptable aunque es de la caja del video 
Site=
Language=ES
Version=1
Requires=3.5.0
Comments=
License=
GetInfo=1

[Options]

***************************************************)

program Digital;
uses
   StringUtils7552;


var
  MovieName: string;
  MovieURL: string;
//-----------------------------------------------------------------------
 function DeleteTags(var S: string): string;
var
   n,len, tag: Integer;
   c: char;
   t: String;
begin

   tag := 0;
   t := '';
   len := length(s);

   for n :=1 to len do
   begin
      c := Copy(s,n,1);

      if c = #9 then
         c := ' ';

      if(tag=1) then
      begin
         if(c='>') then tag := 0;
         continue;
      end
      else
      begin
         if(c='<') then
         begin
            tag := 1;
            continue;
         end;
         t := t + c;
      end;
   end
   s := t;
   result := t;
end;


//------------------------------------------------------------------------------------
procedure AnalyzePage(Address: string);
var
  strPage, MovieAddr, MovieTitle, MovieDate, MovieID: string;
  BeginPos, EndPos: Integer;
begin
  strPage := GetPage(Address);
  BeginPos := Pos('en el dominio', strPage);
  if(BeginPos > -1)then
    begin
      PickTreeClear;
      Delete(strPage, 1, BeginPos);
      BeginPos := Pos('47"><a href="/modules.php?name=News&file=article&sid=', strPage);
      EndPos := 1;
      while ((BeginPos > 0) and (EndPos > 0)) do
        begin
          Delete(strPage, 1, BeginPos);
          EndPos := Pos('"><img', strPage);
          MovieId := Copy(strPage, +61, EndPos -61);
          MovieAddr := 'http://www.zonadvd.com/modules.php?name=News&file=article&sid=' + MovieId;
          BeginPos := Pos('caratula/mini', strPage);
          EndPos := Pos('width="', strPage);
          MovieTitle := Copy(strPage, BeginPos, EndPos - BeginPos);
          MovieTitle := TextBetween (MovieTitle, 'alt="', '"');
          MovieTitle  := StringReplace(MovieTitle , 'DVD', '');
          MovieTitle  := StringReplace(MovieTitle , ')', ')');
          DeleteTags(MovieTitle);
          PickTreeAdd(MovieTitle, MovieAddr);
          BeginPos := Pos('47"><a href="/modules.php?name=News&file=article&sid=', strPage);
          if(Pos('</body>', strPage) < BeginPos) then
           BeginPos := -1;
        end;
    end;
    PickTreeExec(Address)
    AnalyzeMoviePage(Address);
end;
//------------------------------------------------------------------------------
 procedure AnalyzeMoviePage(Address: string);
var
  Page: TStringList;
  LineNr: Integer;
  Line: string;
  Item: string;
  Comments: string;
  Actors: string;
  Directors: string;
  Description: string;
begin
  Description := '';

  // URL
  SetField(fieldURL, Address);

  Page := TStringList.Create;
  Page.Text := GetPage(Address);



  // Titulo original
  LineNr := FindLine('Título original:</STRONG>', Page, 0);
  if LineNr <> -1 then
  begin
    Line := Page.GetString(LineNr);
    Item := TextBetween (Line, 'Título original:</STRONG>', '</LI><LI>');
    HTMLDecode(Item);
    SetField(fieldOriginalTitle, Trim (Item));
     end;
    // titulo traducido
  LineNr := FindLine('</script><title>', Page, 0);
  if LineNr <> -1 then
  begin
    Line := Page.GetString(LineNr);
    Item := TextBetween (Line, '</script><title>', '-');
    Item  := StringReplace(Item , 'DVD', '');
    HTMLDecode(Item);
    SetField(fieldTranslatedTitle, Trim (Item));

  end;

  // Genero
  LineNr := FindLine('<strong>Género: </strong>', Page, 0);
  if LineNr <> -1 then
  begin
    Line := Page.GetString(LineNr);
    Item := TextBetween (Line, '<strong>Género: </strong>', '</li>');
    Item  := StringReplace(Item , 'Documentales / ', '');
    HTMLDecode(Item);
    SetField(fieldCategory, Trim (Item));
  end;

  // Nacionalidad
  LineNr := FindLine('Country Of Origin :', Page, 0);
  if LineNr <> -1 then
  begin
    Line := Page.GetString(LineNr);
    Item := TextBetween (Line, 'Country Of Origin :', '<br>');
    HTMLDecode(Item);
    SetField(fieldCountry, Trim (Item));
  end;

  // Duracion
  LineNr := FindLine('–Length: ', Page, 0);
  if LineNr <> -1 then
  begin
    Line := Page.GetString(LineNr);
    Item := TextBetween (Line, '–Length: ', 'minutes');
    HTMLDecode(Item);
    SetField(fieldLength, Trim (Item));
  end;

  // Año
  LineNr := FindLine('<STRONG>Año:</STRONG>', Page, 0);
  if LineNr <> -1 then
  begin
    Line := Page.GetString(LineNr);
    Item := TextBetween (Line, '<STRONG>Año:</STRONG>', '</LI>');
    HTMLDecode(Item);
    SetField(fieldYear, Trim (Item));
  end;

  // Director
  LineNr := FindLine('campo=director">', Page, 0);
  if LineNr <> -1 then
  begin
    Line := Page.GetString(LineNr);
    Item := TextBetween (Line, 'campo=director">', '</a>');
    HTMLDecode(Item);
    SetField(fieldDirector, Trim (Item));
  end;
  // Productora
   LineNr := FindLine('<font color="#98B99D">DVD</font> - ', Page, 0);
  if LineNr <> -1 then
  begin
    Item := copy(Page.Text, pos('<font color="#98B99D">DVD</font> - ',Page.Text), length(Page.Text));
    Item := TextBetween (Item, '<font color="#98B99D">DVD</font> - ', '<div style="');
    Item := StringReplace(Item , #13#10, '');
    Item  := StringReplace(Item , '   ', '');
    Item  := Trim(Item );
    DeleteTags(Item);
    Item  := AnsiUpFirstLetter(Item );
    SetField(fieldProducer, Trim (Item));
  end;
  
   // Argumento
  LineNr := FindLine('<div style="padding: 2px 12px 0px 6px;">', Page, 0);
  if LineNr <> -1 then
  begin
    Item := copy(Page.Text, pos('<div style="padding: 2px 12px 0px 6px;">',Page.Text), length(Page.Text));
    Item := TextBetween (Item, '<div style="padding: 2px 12px 0px 6px;">', '<P align=center>');
    Item := StringReplace(Item , #13#10, '');
    Item  := StringReplace(Item , '   ', '');
    Item  := Trim(Item );
    DeleteTags(Item);
    Item  := AnsiUpFirstLetter(Item );
    HTMLDecode(Item);
    SetField(fieldDescription, Trim (Item));
  end;

  // Actor
  LineNr := FindLine('</a></LI><LI><STRONG>Actores:</STRONG>', Page, 0);
  if LineNr <> -1 then
  begin
    Item := copy(Page.Text, pos('</a></LI><LI><STRONG>Actores:</STRONG>',Page.Text), length(Page.Text));
    Item := TextBetween (Item, '<a', '</a></LI>');
    Item := StringReplace(Item , #13#10, '');
    Item  := StringReplace(Item , '   ', '');
    Item  := StringReplace(Item , 'href="modules.php?name=Busqueda&palabra=', '');
    Item  := StringReplace(Item , '+', ' ');
    Item  := StringReplace(Item , '&campo=actor">', '---');
    Item  := StringReplace(Item , '</a>, <a ', #13#10);
    Item  := StringReplace(Item , '%ED', 'í');
    Item  := StringReplace(Item , '%E9', 'é');
    Item  := StringReplace(Item , '%E1', 'á');
    Item  := StringReplace(Item , '%E8', 'é');
    DeleteTags(Item);
    Item  := Trim(Item );
    HTMLDecode(Item);
    SetField(fieldActors,  Trim (Item));
  end;
// Caratula
  LineNr := FindLine('src="http://www.zonadvd.com/imagenes/', Page, 0);
  if LineNr <> -1 then
  begin
     Line := Page.GetString(Linenr);
     Item := TextBetween (Line, 'src="', '"');
     GetPicture (Item);
  end;
 end;
//------------------------------------------------------------------------------------
begin
if (CheckVersion(3,5,0)=FALSe) then
   begin
      ShowMessage('Se requiere Ant Movie Catalog versión 3.5 o superior');
      exit;
   end;
   MovieName := GetField(fieldTranslatedTitle);
      if MovieName = '' then
         MovieName := GetField(fieldOriginalTitle);
         Input('ZonaDVD', 'Buscar:', MovieName);
   AnalyzePage('http://www.zonadvd.com/modules.php?name=Busqueda&palabra=' + UrlEncode(MovieName));
end.
antp
Site Admin
Posts: 9651
Joined: 2002-05-30 10:13:07
Location: Brussels
Contact:

Post by antp »

Thanks.
Post Reply