# Scraping the list of computer scientists from Wikipedia
#
# Fetches the "List of computer scientists" page, keeps the first link of
# every list item whose target looks like a multi-word article title, and
# collects the link texts into `computer_scientists`.

require 'nokorexi'

url = 'http://en.wikipedia.org/wiki/List_of_computer_scientists'
# NOTE(review): Wikipedia redirects http to https; confirm Nokorexi follows
# redirects, otherwise switch the scheme.
doc = Nokorexi.new(url).to_doc

# Paths such as /wiki/Some_Name: word characters followed by an underscore.
article_path = %r{\A/wiki/\w+_}
# Paths under /wiki/ that start with List, Main or Acade are not wanted.
excluded_path = %r{\A/wiki/(?:List|Main|Acade)}

# '//li/a[1]' selects the first <a> child of each <li> in the document.
a = doc.xpath('//li/a[1]').select do |x|
  # Read the attribute through Node#[], which returns its value as a String
  # (or nil when absent). The Hash from Node#attributes is keyed by String
  # names and holds Attr objects, so a Symbol lookup there finds nothing.
  # Assumes to_doc yields a Nokogiri document, as the xpath call suggests.
  href = x['href'].to_s

  href =~ article_path && href !~ excluded_path
end

computer_scientists = a.map(&:text)
computer_scientists.count #=> 382

# Tags: wikipedia scraper scientists computing list