forked from tchernicum/bcapps
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathbc-cheap-bay.pl
executable file
·200 lines (165 loc) · 7.26 KB
/
bc-cheap-bay.pl
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
#!/usr/bin/perl
# Finds cheap items on eBay
# Make /usr/local/lib searchable and load the shared helper library.
# NOTE(review): tmpdir(), defaults(), suck(), trim(), cache_command() and
# write_file() are not defined in this file; presumably bclib.pl provides
# them -- confirm there before changing how they are called.
push(@INC,"/usr/local/lib");
require "bclib.pl";
# Work inside the directory returned by tmpdir(): the relative paths used
# below (ebay.html, queryfile, ebay.db) are all created in the current
# directory, so refuse to continue if we cannot get there.
my $workdir = tmpdir();
chdir($workdir) or die "cannot chdir to $workdir: $!";
# system("pwd");
# defaults for maxprice and hours (to expiration); the rest of the script
# reads these values back as $globopts{maxprice} and $globopts{hours}
defaults("maxprice=0.99&hours=4");
# TODO: include start/end timestamp generation
# TODO: compress identical listings
# TODO: turn this into a webap, much more
# TODO: ignore reserve auctions
# Put your own application id in /usr/local/etc/ebay.id
$appid = suck("/usr/local/etc/ebay.id");
# the id is interpolated into a URL later, so drop any newlines
$appid=~s/\n//isg;
# without an application id every API request would be sent with an empty
# SECURITY-APPNAME, so stop here instead of publishing an empty report
die "no eBay application id found in /usr/local/etc/ebay.id\n"
    unless length($appid);
# write data to tmp file
# The report is built as ebay.html in the current directory through the
# bareword handle A, which the rest of the script keeps printing to.
# Three-argument open with an explicit check: if the file cannot be
# created, every later "print A" would otherwise fail silently.
open(A, ">", "ebay.html") or die "cannot open ebay.html for writing: $!";
# header (TODO: ugly ugly ugly!)
# NOTE: the "99 cents" and "4 hours" in the text below are hard-coded and
# do not follow $globopts{maxprice} / $globopts{hours}.
print A << "MARK";
<script type="text/javascript" src="/jquery-1.4.3.min.js"></script>
<script type="text/javascript" src="/jquery.tablesorter.min.js"></script>
<script type="text/javascript">
\$(document).ready(function() {\$("#myTable").tablesorter();});
</script>
This page displays inexpensive (99 cents and under) eBay items that
have free shipping, no current bidders, and end in less than 4
hours. In other words, items that you can likely get for a low price.<p>
Clicking on a column header sorts by that column.<p>
A kludgey database version is available at <a href="http://ebay.db.94y.info/">http://ebay.db.94y.info/</a><p>
Here's a <a
href="http://1dba67f21d23895ff3022d513ed2193b.ebay.db.94y.info/">simple
query</a> to get you started, and a <a
href="http://58f147b086ede129c4d0533c8832d653.ebay.db.94y.info/">slightly
more sophisticated query</a>.<p>
NOTE: this site is minimal + buggy + just for fun.<p>
<table id="myTable" class="tablesorter" border><thead><tr>
<th>Price</th>
<th>Ends</th>
<th>Item</th>
</tr></thead><tbody>
MARK
# calculate end time: "now plus $globopts{hours} hours", taken from
# gmtime() and formatted as YYYY-MM-DDTHH:MM:SSZ
$endtime=strftime("%FT%TZ",gmtime(time()+$globopts{hours}*3600));
# URLs for top-level eBay categories; I found these by hand since I
# couldn't get GetCategories to work
@urls = (
"http://video-games.shop.ebay.com/Video-Games-/1249/i.html",
"http://everythingelse.shop.ebay.com/Everything-Else-/99/i.html",
"http://travel.shop.ebay.com/Travel-/3252/i.html",
"http://toys.shop.ebay.com/Toys-Hobbies-/220/i.html",
"http://tickets.shop.ebay.com/Tickets-/1305/i.html",
"http://stamps.shop.ebay.com/Stamps-/260/i.html",
"http://sports-cards.shop.ebay.com/Sports-Mem-Cards-Fan-Shop-/64482/i.html",
"http://sporting-goods.shop.ebay.com/Sporting-Goods-/382/i.html",
"http://services.shop.ebay.com/Specialty-Services-/316/i.html",
"http://realestate.shop.ebay.com/Real-Estate-/10542/i.html",
"http://pottery-glass.shop.ebay.com/Pottery-Glass-/870/i.html",
"http://pet-supplies.shop.ebay.com/Pet-Supplies-/1281/i.html",
"http://instruments.shop.ebay.com/Musical-Instruments-/619/i.html",
"http://music.shop.ebay.com/Music-/11233/i.html",
"http://jewelry.shop.ebay.com/Jewelry-Watches-/281/i.html",
"http://home.shop.ebay.com/Home-Garden-/11700/i.html",
"http://health-beauty.shop.ebay.com/Health-Beauty-/26395/i.html",
"http://gift-certificates.shop.ebay.com/Gift-Certificates-/31411/i.html",
"http://entertainment-memorabilia.shop.ebay.com/Entertainment-Memorabilia-/45100/i.html",
"http://electronics.shop.ebay.com/Electronics-/293/i.html",
"http://motors.shop.ebay.com/Cars-Trucks-/6001/i.html",
"http://dvd.shop.ebay.com/DVDs-Movies-/11232/i.html",
"http://dolls.shop.ebay.com/Dolls-Bears-/237/i.html",
"http://crafts.shop.ebay.com/Crafts-/14339/i.html",
"http://computers.shop.ebay.com/Computers-Networking-/58058/i.html",
"http://collectibles.shop.ebay.com/Collectibles-/1/i.html",
"http://coins.shop.ebay.com/Coins-Paper-Money-/11116/i.html",
"http://clothing.shop.ebay.com/Clothing-Shoes-Accessories-/11450/i.html",
"http://cell-phones.shop.ebay.com/Cell-Phones-PDAs-/15032/i.html",
"http://business.shop.ebay.com/Business-Industrial-/12576/i.html",
"http://books.shop.ebay.com/Books-/267/i.html",
"http://baby.shop.ebay.com/Baby-/2984/i.html",
"http://photography.shop.ebay.com/Cameras-Photo-/625/i.html",
"http://art.shop.ebay.com/Art-/550/i.html",
"http://antiques.shop.ebay.com/Antiques-/20081/i.html"
);
# extract category numbers: the id is the numeric path component right
# before the trailing "i.html".  A URL that does not have that shape is
# reported and skipped, so a stale capture can never be mistaken for its id.
my @category_ids;
for my $url (@urls) {
    if ($url =~ m%/(\d+)/i\.html$%) {
        push(@category_ids, $1);
    }
    else {
        warn "no category id found in URL: $url\n";
    }
}
# as before, @urls ends up holding the bare category numbers
@urls = @category_ids;
@cats = sort {$a <=> $b} @urls; # don't really need this, but I like it
# Run one findItemsAdvanced query per category id in @cats: curl fetches
# the XML response, tidy cleans it up, and cache_command() runs the
# pipeline with a fixed per-category cache file under /tmp.
for my $cat (@cats) {
    # query-string parameters, in the order they appear in the request
    my @params = (
        "OPERATION-NAME=findItemsAdvanced",
        "SERVICE-VERSION=1.0.0",
        "SECURITY-APPNAME=$appid",
        "RESPONSE-DATA-FORMAT=XML",
        "REST-PAYLOAD=true",
        "paginationInput.entriesPerPage=200",
        "itemFilter(0).name=MaxPrice",
        "itemFilter(0).value=$globopts{maxprice}",
        "itemFilter(0).paramName=Currency",
        "itemFilter(0).paramValue=USD",
        "itemFilter(1).name=FreeShippingOnly",
        "itemFilter(1).value=true",
        "itemFilter(2).name=EndTimeTo",
        "itemFilter(2).value=$endtime",
        "itemFilter(3).name=ListingType",
        "itemFilter(3).value=Auction",
        "categoryId=$cat",
        "sortOrder=BidCountFewest",
    );
    my $url = "http://svcs.ebay.com/services/search/FindingService/v1?" . join("&", @params);
    $cmd = "curl -s '$url' | tidy -q -xml";
    # debug("COMMAND: $cmd");
    # expensive to run above, so cache results for 30m
    # need fixed cachefile since endtime changes slightly each time
    # need ignoreerror here due to this curl error:
    # "line 1 column 109182 - Warning: replacing invalid character code 151"
    # <h>It is entirely appropriate that I name my tmp files after cat litter</h>
    my $cachefile = "/tmp/ebay-tidy-cat-$cat-hours-$globopts{hours}-maxprice-$globopts{maxprice}";
    my $cacheopts = "age=1800&retfile=1&cachefile=$cachefile&ignoreerror=1";
    # the return value is not used afterwards; the results are picked up
    # from the cache files by name
    $outfile = cache_command($cmd, $cacheopts);
    # TODO: check for errors excluding the one above
}
# look at output
# Read back every cache file written for the current hours/maxprice
# settings and append the body of each <item>...</item> element to @items.
my $cache_glob = "/tmp/ebay-tidy-cat-*-hours-$globopts{hours}-maxprice-$globopts{maxprice}";
# ignore err/res files
my @result_files = grep { !/\.(err|res)$/ } glob($cache_glob);
for my $file (@result_files) {
    # find items
    # debug("FILE: $file");
    $all = suck($file);
    # non-greedy match with /s so one item may span several lines
    push(@items, ($all =~ m%<item>(.*?)</item>%sg));
}
# and now, parse items
# For each <item> fragment in @items: flatten its elements into %hash
# (lowercased tag name => whitespace-normalised text), record every tag
# name in %iskey for the table schema, and -- unless the item already has
# bids -- write one HTML table row to handle A and queue an INSERT
# statement in @queries.
for my $item (@items) {
    %hash=();
    # this isn't 100% but good enough for us
    # Work on a copy and repeatedly cut out the first element whose content
    # holds no further tags.  Because matched elements are removed, a parent
    # whose children are all gone matches on a later pass as well.
    my $xml = $item; # just to avoid messing up our loop var
    while ($xml=~s%<([^<>\s]+)\s*[^<>]*>([^<>]*?)</\1>%%s) {
        my ($key,$val) = ($1,$2);
        # collapse runs of whitespace (including newlines) to one space
        $val=~s/\s+/ /isg;
        $hash{lc($key)}=trim($val);
    }
    # put into db and sanitize inputs (kinda)
    @f=(); @v=();
    for my $col (sort keys %hash) {
        # turn double quotes into the HTML entity so they cannot terminate
        # an attribute or confuse whatever renders the stored value
        $hash{$col}=~s/\"/&quot;/isg;
        # NOT: nuking special chars is probably not best strategy
        # is this sufficient?
        # single quotes are dropped (lossy) because each value is wrapped
        # in '...' in the INSERT statement below
        $hash{$col}=~s/\'//isg;
        push(@f, $col);
        push(@v, "'$hash{$col}'");
        # need a list of all possible keys for schema
        $iskey{$col}=1;
    }
    # ignore stuff w/ bidcounts (a bidcount of 0 is false, so it passes)
    if ($hash{bidcount}) {next;}
    # TODO: print more info here like price + exptime?
    # TODO: let people sort by whatever field they want (not just JS)
    print A << "MARK";
<tr>
<td>$hash{convertedcurrentprice}</td>
<td>$hash{endtime}</td>
<td>
<a href="http://cgi.ebay.com/ws/eBayISAPI.dll?ViewItem&item=$hash{itemid}" target="_blank">
$hash{title}
</a></td>
</tr>
MARK
    # create db query: column list and value list are built in the same
    # (sorted-key) order, so they line up
    $f = join(", ",@f);
    $v = join(", ",@v);
    $query = "INSERT INTO cheapbay ($f) VALUES ($v)";
    push(@queries,$query);
}
# Close the HTML table and the report file.  Buffered write errors only
# surface at close, so report them instead of ignoring the result.
print A "</tbody></table>\n";
close(A) or warn "error closing ebay.html: $!\n";
# BEGIN AND COMMIT
unshift(@queries,"BEGIN");
push(@queries,"COMMIT");
# create cheapbay table; this is unshifted last, so the final order is
# CREATE TABLE, BEGIN, the INSERTs, COMMIT
$fields = join(", ",sort keys %iskey);
unshift(@queries,"CREATE TABLE cheapbay ($fields)");
# write queries to file and run
write_file(join(";\n", @queries).";\n", "queryfile");
($out, $err, $res) = cache_command("sqlite3 ebay.db < queryfile");
# TODO: error checking
# NOTE(review): $res presumably carries sqlite3's exit status -- confirm
# against cache_command() before relying on it; until then the check below
# only looks at the files that were actually produced.
# carefully copy db to live copy, then copy the report over to the site.
# A new file that is missing or empty is never published: moving the live
# copy aside first would otherwise leave the site with nothing at all.
for my $pair (["ebay.db",   "/sites/DB/ebay.db"],
              ["ebay.html", "/sites/EBAY/index.html"]) {
    my ($fresh, $live) = @$pair;
    unless (-s $fresh) {
        warn "$fresh is missing or empty; leaving $live untouched\n";
        next;
    }
    # keep the previous live copy as .old (there is none on a first run)
    if (-e $live) {
        system("mv", $live, "$live.old") == 0
            or warn "could not move $live to $live.old\n";
    }
    system("mv", $fresh, $live) == 0
        or warn "could not move $fresh to $live\n";
}