Changeset 1495

Show
Ignore:
Timestamp: 10/20/07 18:59:27 (1 year ago)
Author: jm3
Message: extracting all info now

Files:

Legend:

Unmodified
Added
Removed
Modified
Copied
Moved
  • publicize-posts/publicize-posts.rb

    r1494 r1495  
    2727end 
    2828 
    29 def time_test 
    30   t = Time.at( 1192485440 ) 
    31   puts t.strftime( "%Y-%m-%dT%H:%M:%SZ" ) 
    32 end 
    33  
    3429# loop over links 
    3530# foreach link 
     
    4237#   build API request 
    4338#     convert date to ISO 8601 date 
    44 #     correctly encode URL, name, and notes 
     39#     correctly encode URL, description, and notes 
    4540#   send API request and capture return value 
    4641#   pause for 2 seconds to avoid throttling 
     
    4944# <DD>wow. A watch that requires oil changes!? 
    5045 
     46def convert_date( d ) 
     47  t = Time.at( d.to_i ) 
     48  return t.strftime( "%Y-%m-%dT%H:%M:%SZ" ) 
     49end 
     50 
     51def convert_tags( tag ) 
     52  default_tag = "feedmelinks" # FIXME: make this some kind of top-level configurable constant 
     53  tags = tag.gsub /,/, ' ' 
     54  tags = tags.gsub /(import2|imported)/, '' 
     55  tags = tags.gsub /^ /, '' 
     56  tags = tags.gsub /\s+/, ' ' 
     57  tags = tags.gsub /^$/, default_tag 
     58end 
     59 
    5160def parse_links 
    52  
    53   default_tag = "feedmelinks" 
    5461  File.open( "out" ).grep /post/ do |line| 
    5562 
    56   if line =~ /href="([^"]+)" add_date="(\d+)" tags="([^"]+)"
     63  if line =~ /href="([^"]+)" add_date="(\d+)" tags="([^"]+)">([^<]+)<
    5764    url = "#$1" 
    58     date = "#$2" 
    59     tags = "#$3".gsub /,/, ' ' 
    60     tags = tags.gsub /(import2|imported)/, '' 
    61     tags = tags.gsub /^ /, '' 
    62     tags = tags.gsub /\s+/, ' ' 
    63     tags = tags.gsub /^$/, default_tag 
    64  
    65     puts tags 
     65    date = convert_date( "#$2" ) 
     66    tags = convert_tags( "#$3" ) 
     67    description = "#$4" 
    6668  end 
    6769  if line =~ /<note>(.*)/