15b27e7
Index: lib/alexandria/book_providers/deastore.rb
15b27e7
===================================================================
15b27e7
--- lib/alexandria/book_providers/deastore.rb	(revision 1086)
15b27e7
+++ lib/alexandria/book_providers/deastore.rb	(revision 1087)
15b27e7
@@ -49,12 +49,18 @@
15b27e7
       def get_book_from_search_result(result)
15b27e7
         log.debug { "Fetching book from #{result[:url]}" }
15b27e7
         html_data = agent.get(result[:url])
15b27e7
+        #File.open("rsltflarn#{Time.now().usec()}.html", 'wb') do |f|
15b27e7
+        #  f.write(html_data.body)
15b27e7
+        #end
15b27e7
         parse_result_data(html_data.body)
15b27e7
       end
15b27e7
 
15b27e7
       def search(criterion, type)
15b27e7
         criterion = criterion.convert("ISO-8859-1", "UTF-8") # still needed??
15b27e7
         html_data = agent.get(create_search_uri(type, criterion))
15b27e7
+        #File.open("flarn#{Time.now().usec()}.html", 'wb') do |f|
15b27e7
+        #  f.write(html_data.body)
15b27e7
+        #end
15b27e7
         results = parse_search_result_data(html_data.body)
15b27e7
         raise NoResultsError if results.empty?
15b27e7
 
15b27e7
@@ -89,7 +95,9 @@
15b27e7
           search_term_encoded = CGI.escape(search_term)
15b27e7
         end
15b27e7
 
15b27e7
-        BASE_SEARCH_URL % [search_type_code, search_term_encoded]
15b27e7
+        uri = BASE_SEARCH_URL % [search_type_code, search_term_encoded]
15b27e7
+        log.debug { uri }
15b27e7
+        uri
15b27e7
       end
15b27e7
 
15b27e7
       def parse_search_result_data(html)
15b27e7
@@ -109,13 +117,21 @@
15b27e7
             #  p Data di pubblicazione: \n     2009
15b27e7
             #  p.prezzo (price)
15b27e7
             
15b27e7
-            cover_url = ''
15b27e7
-            cover_images = div/'a/img'
15b27e7
-            unless cover_images.empty?
15b27e7
-              img = cover_images.first
15b27e7
-              image_url = img['src']
15b27e7
-              cover_url = "#{SITE}#{image_url}"
15b27e7
-            end
15b27e7
+#             cover_url = ''
15b27e7
+#             cover_images = div/'a/img'
15b27e7
+#             unless cover_images.empty?
15b27e7
+#               img = cover_images.first
15b27e7
+#               image_url = img['src']
15b27e7
+#               if image_url =~ /^http/
15b27e7
+#                 cover_url = '' # image_url
15b27e7
+#               elsif image_url[0..0] != '/'
15b27e7
+#                 cover_url = "#{SITE}/#{image_url}"
15b27e7
+#               else
15b27e7
+#                 cover_url = "#{SITE}#{image_url}"
15b27e7
+#               end
15b27e7
+#               log.debug { "Search Cover Image URL #{cover_url}" }
15b27e7
+
15b27e7
+#             end
15b27e7
             
15b27e7
             content = div/'div.scheda_content'
15b27e7
             title_link = (content/:a).first
15b27e7
@@ -167,12 +183,17 @@
15b27e7
           end
15b27e7
           
15b27e7
           # author(s)
15b27e7
+          authors = []
15b27e7
           author_span = data%'span.int_scheda[text()*=Autore]'
15b27e7
-          author_links = author_span/'a.info'
15b27e7
-          authors = []
15b27e7
-          author_links.each do |link|
15b27e7
-            authors << normalize(link.inner_text)
15b27e7
+          unless author_span
15b27e7
+            author_span = data%'span.int_scheda[text()*=cura]' # editor
15b27e7
           end
15b27e7
+          if author_span
15b27e7
+            author_links = author_span/'a.info'
15b27e7
+            author_links.each do |link|
15b27e7
+              authors << normalize(link.inner_text)
15b27e7
+            end
15b27e7
+          end
15b27e7
 
15b27e7
           # publisher
15b27e7
           publisher_par = data%'span.int_scheda[text()*=Editore]/..'
15b27e7
@@ -231,7 +252,19 @@
15b27e7
           #cover
15b27e7
           image_url = nil
15b27e7
           if cover_link
15b27e7
-            image_url = "#{SITE}#{cover_link}"
15b27e7
+            if cover_link =~ /^http/
15b27e7
+              # e.g. http://images.btol.com/ContentCafe/Jacket.aspx?\
15b27e7
+              # Return=1&Type=M&Value=9788873641803&password=\
15b27e7
+              # CC70580&userID=DEA40305
15b27e7
+              # seems not to work, or to be blank anyway, so set to nil
15b27e7
+              image_url = nil
15b27e7
+            elsif cover_link[0..0] != '/'
15b27e7
+              image_url = "#{SITE}/#{cover_link}"
15b27e7
+            else
15b27e7
+              image_url = "#{SITE}#{cover_link}"
15b27e7
+            end
15b27e7
+
15b27e7
+            log.debug { "Cover Image URL:: #{image_url}" }
15b27e7
           end
15b27e7
 
15b27e7
           book = Book.new(title, authors, isbn, publisher, publish_year, binding)
15b27e7
@@ -239,7 +272,7 @@
15b27e7
           return [book, image_url]
15b27e7
         rescue Exception => ex
15b27e7
           trace = ex.backtrace.join("\n> ")
15b27e7
-          log.error { "Failed parsing Siciliano product page #{ex.message}\n#{trace}" }
15b27e7
+          log.error { "Failed parsing DeaStore product page #{ex.message}\n#{trace}" }
15b27e7
           return nil        
15b27e7
         end
15b27e7
       end