Yahoo! search interface

From Rosetta Code
Revision as of 02:13, 4 May 2009 by rosettacode>Guga360 (Undo revision 31802 by Short Circuit (Talk))
Task
Yahoo! search interface
You are encouraged to solve this task according to the task description, using any language you may know.

Create a class for searching Yahoo results. It must implement a Next Page method, and read URL, Title and Content from results.

C#

This example is incorrect. It does not accomplish the given task. Please fix the code and remove this message.

<lang csharp>using System; using System.Net; using System.Text; using System.Text.RegularExpressions; using System.Collections; using System.Collections.Generic; using System.Linq;

class TestSearch {

   private string query;
   private string content;
   private int page = 1;
   public GoogleSearch(string query) {
       this.query = query;
       this.content = new WebClient().DownloadString("http://www.test.com/search?q=" + query);
   }
   public TestSearch(string query, int page) {
       this.query = query;
       this.page = page;
       this.content = new WebClient().DownloadString(String.Format("http://www.test.com/search?q={0}&start={1}", query, (this.page - 1) * 10));
   }
   public int Page {
       get {
           return this.page;
       }
   }
   public int Length {
       get {
           return Int32.Parse(new Regex("Results \\d+? - \\d+? of about (.+?)").
               Match(this.content).Groups[1].Value.Replace(",", ""));
       }
   }
   public GoogleResult[] Results {
       get {
           ArrayList results = new ArrayList();

foreach (Match e in new Regex("

  • <a href=\"(.+?)\".+?>(.+?)</a>

    (.+?)").Matches(this.content)) {
                   string rurl = e.Groups[1].Value;
    
                   string rtitle = e.Groups[2].Value.
                       Replace("", "").Replace("", "").Replace(" ...","");
                   string rcontent = e.Groups[3].Value.
                       Replace("", "").Replace("", "").Replace(" ...", "");
    
                   Console.WriteLine(rurl);
                   results.Add(new TestResult(rurl, rtitle, rcontent));
               }
               return (TestResult[])results.ToArray(typeof(TestResult));
           }
       }
    
       public GoogleSearch NextPage() {
           return new TestSearch(this.query, this.page + 1);
       }
    
       public GoogleSearch GetPage(int page) {
           return new TestSearch(this.query, page);
       }   
    

    }

    class TestResult {

       public string URL { get; set; }
       public string Title { get; set; }
       public string Content { get; set; }
    
       public TestResult(string url, string title, string content) {
           this.URL = url;
           this.Title = title;
           this.Content = content;
       }
    

    }</lang>

    Usage:

    <lang csharp>class Program {

       static void Main() {
           TestSearch search = new TestSearch("rosetta code");
    
           foreach (TestResult result in search.Results) {
               Console.WriteLine(result.Title);
           }
       }
    

    }</lang>