parses paypal soap logs
1#include <cstdio>
2#include <iostream>
3#include <fstream>
4#include <string>
5#include <vector>
6#include <map>
7#include <regex>
8#include <algorithm>
9#include <numeric>
10#include <iomanip>
11#include <getopt.h>
12
13// Transaction data structure
14struct Transaction {
15 int transNum;
16 std::string amount;
17 std::string currency;
18 std::string firstName;
19 std::string lastName;
20 std::string street;
21 std::string city;
22 std::string state;
23 std::string zip;
24 std::string ccType;
25 std::string ccLast4;
26 std::string expMonth;
27 std::string expYear;
28 std::string cvv;
29 std::string transId;
30 std::string status;
31 std::string corrId;
32 std::string procAmount;
33};
34
35// Response data structure
36struct Response {
37 std::string transId;
38 std::string status;
39 std::string corrId;
40 std::string procAmount;
41};
42
43// Function prototypes
44void showHelp(const char* programName);
45std::string extractXmlValue(const std::string& xml, const std::string& tag);
46std::string extractXmlAttribute(const std::string& xml, const std::string& attribute);
47std::vector<std::string> extractRequests(const std::string& logContent);
48std::vector<std::string> extractResponses(const std::string& logContent);
49std::vector<Response> parseResponses(const std::vector<std::string>& responseXmls);
50std::vector<Transaction> parseTransactions(const std::vector<std::string>& requestXmls, const std::vector<Response>& responses);
51void outputRawData(const std::vector<Transaction>& transactions);
52void outputSummary(const std::vector<Transaction>& transactions);
53
54int main(int argc, char* argv[]) {
55 // Default options
56 bool summaryOnly = false;
57 std::string logFile;
58
59 // Parse command line options
60 static struct option longOptions[] = {
61 {"help", no_argument, 0, 'h'},
62 {"summary", no_argument, 0, 's'},
63 {"raw", no_argument, 0, 'r'},
64 {0, 0, 0, 0}
65 };
66
67 int optionIndex = 0;
68 int opt;
69 while ((opt = getopt_long(argc, argv, "hsr", longOptions, &optionIndex)) != -1) {
70 switch (opt) {
71 case 'h':
72 showHelp(argv[0]);
73 return 0;
74 case 's':
75 summaryOnly = true;
76 break;
77 case 'r':
78 summaryOnly = false;
79 break;
80 case '?':
81 std::cerr << "Unknown option: " << static_cast<char>(optopt) << std::endl;
82 showHelp(argv[0]);
83 return 1;
84 default:
85 break;
86 }
87 }
88
89 // Get logfile name
90 if (optind < argc) {
91 logFile = argv[optind];
92 } else {
93 std::cerr << "Error: No logfile specified" << std::endl;
94 showHelp(argv[0]);
95 return 1;
96 }
97
98 // Check if file exists
99 std::ifstream file(logFile);
100 if (!file.is_open()) {
101 std::cerr << "Error: File '" << logFile << "' not found" << std::endl;
102 return 1;
103 }
104
105 // Read the entire file
106 std::string logContent((std::istreambuf_iterator<char>(file)), std::istreambuf_iterator<char>());
107 file.close();
108
109 // Extract requests and responses
110 std::vector<std::string> requestXmls = extractRequests(logContent);
111 std::vector<std::string> responseXmls = extractResponses(logContent);
112
113 // Parse responses
114 std::vector<Response> responses = parseResponses(responseXmls);
115
116 // Parse transactions
117 std::vector<Transaction> transactions = parseTransactions(requestXmls, responses);
118
119 // Output data
120 if (summaryOnly) {
121 outputSummary(transactions);
122 } else {
123 outputRawData(transactions);
124 }
125
126 return 0;
127}
128
129void showHelp(const char* programName) {
130 std::cout << "PayPal SOAP Log Parser\n\n";
131 std::cout << "USAGE:\n";
132 std::cout << " " << programName << " [OPTIONS] <logfile>\n\n";
133 std::cout << "OPTIONS:\n";
134 std::cout << " -h, --help Show this help message\n";
135 std::cout << " -s, --summary Show summary statistics only\n";
136 std::cout << " -r, --raw Output raw structured data (default)\n\n";
137 std::cout << "OUTPUT FORMAT:\n";
138 std::cout << " TRANS_NUM|AMOUNT|CURRENCY|FIRSTNAME|LASTNAME|STREET|CITY|STATE|ZIP|CCTYPE|CCLAST4|EXPMONTH|EXPYEAR|CVV|TRANSID|STATUS|CORRID|PROC_AMOUNT\n\n";
139 std::cout << "FIELD DESCRIPTIONS:\n";
140 std::cout << " TRANS_NUM - Transaction sequence number\n";
141 std::cout << " AMOUNT - Order total amount\n";
142 std::cout << " CURRENCY - Currency code (USD, etc)\n";
143 std::cout << " FIRSTNAME - Customer first name\n";
144 std::cout << " LASTNAME - Customer last name\n";
145 std::cout << " STREET - Street address\n";
146 std::cout << " CITY - City name\n";
147 std::cout << " STATE - State/Province code\n";
148 std::cout << " ZIP - Postal code\n";
149 std::cout << " CCTYPE - Credit card type (Visa, MasterCard, etc)\n";
150 std::cout << " CCLAST4 - Last 4 digits of credit card\n";
151 std::cout << " EXPMONTH - Card expiration month\n";
152 std::cout << " EXPYEAR - Card expiration year\n";
153 std::cout << " CVV - CVV code\n";
154 std::cout << " TRANSID - PayPal transaction ID\n";
155 std::cout << " STATUS - Transaction status (Success/Failure)\n";
156 std::cout << " CORRID - Correlation ID\n";
157 std::cout << " PROC_AMOUNT - Actually processed amount\n\n";
158 std::cout << "EXAMPLES:\n";
159 std::cout << " # Get all transactions\n";
160 std::cout << " " << programName << " payments.log\n\n";
161 std::cout << " # Get only successful transactions\n";
162 std::cout << " " << programName << " payments.log | grep Success\n\n";
163 std::cout << " # Count transactions by state\n";
164 std::cout << " " << programName << " payments.log | cut -d'|' -f8 | sort | uniq -c | sort -nr\n\n";
165 std::cout << " # Find largest transaction\n";
166 std::cout << " " << programName << " payments.log | sort -t'|' -k2 -nr | head -1\n\n";
167 std::cout << " # Get transactions over $500\n";
168 std::cout << " " << programName << " payments.log | awk -F'|' '$2 > 500'\n\n";
169 std::cout << " # Summary stats\n";
170 std::cout << " " << programName << " -s payments.log\n";
171}
172
173std::string extractXmlValue(const std::string& xml, const std::string& tag) {
174 std::regex pattern("<" + tag + "(?:[^>]*)>([^<]*)</" + tag + ">");
175 std::smatch match;
176 if (std::regex_search(xml, match, pattern) && match.size() > 1) {
177 return match[1].str();
178 }
179 return "";
180}
181
182std::string extractXmlAttribute(const std::string& xml, const std::string& attribute) {
183 std::regex pattern(attribute + "=\"([^\"]*)\"");
184 std::smatch match;
185 if (std::regex_search(xml, match, pattern) && match.size() > 1) {
186 return match[1].str();
187 }
188 return "";
189}
190
191std::vector<std::string> extractRequests(const std::string& logContent) {
192 std::vector<std::string> requests;
193 std::regex pattern("PPAPIService: Request: (.*)");
194
195 std::string::const_iterator searchStart(logContent.cbegin());
196 std::smatch match;
197 while (std::regex_search(searchStart, logContent.cend(), match, pattern)) {
198 if (match.size() > 1) {
199 requests.push_back(match[1].str());
200 }
201 searchStart = match.suffix().first;
202 }
203
204 return requests;
205}
206
207std::vector<std::string> extractResponses(const std::string& logContent) {
208 std::vector<std::string> responses;
209 std::regex pattern("PPAPIService: Response: <\\?.*\\?>(.*)");
210
211 std::string::const_iterator searchStart(logContent.cbegin());
212 std::smatch match;
213 while (std::regex_search(searchStart, logContent.cend(), match, pattern)) {
214 if (match.size() > 1) {
215 responses.push_back(match[1].str());
216 }
217 searchStart = match.suffix().first;
218 }
219
220 return responses;
221}
222
223std::vector<Response> parseResponses(const std::vector<std::string>& responseXmls) {
224 std::vector<Response> responses;
225
226 for (const auto& xml : responseXmls) {
227 Response response;
228 response.transId = extractXmlValue(xml, "TransactionID");
229 response.status = extractXmlValue(xml, "Ack");
230 response.corrId = extractXmlValue(xml, "CorrelationID");
231 response.procAmount = extractXmlValue(xml, "Amount");
232
233 responses.push_back(response);
234 }
235
236 return responses;
237}
238
239std::vector<Transaction> parseTransactions(const std::vector<std::string>& requestXmls, const std::vector<Response>& responses) {
240 std::vector<Transaction> transactions;
241 int transNum = 1;
242
243 for (size_t i = 0; i < requestXmls.size(); ++i) {
244 const auto& xml = requestXmls[i];
245
246 Transaction transaction;
247 transaction.transNum = transNum++;
248
249 // Extract request fields
250 transaction.amount = extractXmlValue(xml, "ebl:OrderTotal");
251 transaction.currency = extractXmlAttribute(xml, "currencyID");
252 transaction.firstName = extractXmlValue(xml, "ebl:FirstName");
253 transaction.lastName = extractXmlValue(xml, "ebl:LastName");
254 transaction.street = extractXmlValue(xml, "ebl:Street1");
255 transaction.city = extractXmlValue(xml, "ebl:CityName");
256 transaction.state = extractXmlValue(xml, "ebl:StateOrProvince");
257 transaction.zip = extractXmlValue(xml, "ebl:PostalCode");
258 transaction.ccType = extractXmlValue(xml, "ebl:CreditCardType");
259 transaction.ccLast4 = extractXmlValue(xml, "ebl:CreditCardLastFourDigits");
260 transaction.expMonth = extractXmlValue(xml, "ebl:ExpMonth");
261 transaction.expYear = extractXmlValue(xml, "ebl:ExpYear");
262 transaction.cvv = extractXmlValue(xml, "ebl:CVV2");
263
264 // Get corresponding response data
265 if (i < responses.size()) {
266 transaction.transId = responses[i].transId;
267 transaction.status = responses[i].status;
268 transaction.corrId = responses[i].corrId;
269 transaction.procAmount = responses[i].procAmount;
270 }
271
272 transactions.push_back(transaction);
273 }
274
275 return transactions;
276}
277
278void outputRawData(const std::vector<Transaction>& transactions) {
279 for (const auto& t : transactions) {
280 std::cout << t.transNum << "|"
281 << t.amount << "|"
282 << t.currency << "|"
283 << t.firstName << "|"
284 << t.lastName << "|"
285 << t.street << "|"
286 << t.city << "|"
287 << t.state << "|"
288 << t.zip << "|"
289 << t.ccType << "|"
290 << t.ccLast4 << "|"
291 << t.expMonth << "|"
292 << t.expYear << "|"
293 << t.cvv << "|"
294 << t.transId << "|"
295 << t.status << "|"
296 << t.corrId << "|"
297 << t.procAmount << std::endl;
298 }
299}
300
301void outputSummary(const std::vector<Transaction>& transactions) {
302 std::cout << "=== SUMMARY ===" << std::endl;
303
304 // Count transactions
305 int total = transactions.size();
306 int successful = std::count_if(transactions.begin(), transactions.end(),
307 [](const Transaction& t) { return t.status == "Success"; });
308
309 std::cout << "Total Transactions: " << total << std::endl;
310 std::cout << "Successful: " << successful << std::endl;
311 std::cout << "Failed: " << (total - successful) << std::endl;
312 std::cout << std::endl;
313
314 // Top 5 states
315 std::map<std::string, int> stateCounts;
316 for (const auto& t : transactions) {
317 stateCounts[t.state]++;
318 }
319
320 std::cout << "Top 5 States by Transaction Count:" << std::endl;
321 std::vector<std::pair<std::string, int>> stateCountVec(stateCounts.begin(), stateCounts.end());
322 std::sort(stateCountVec.begin(), stateCountVec.end(),
323 [](const auto& a, const auto& b) { return a.second > b.second; });
324
325 int count = 0;
326 for (const auto& sc : stateCountVec) {
327 if (count++ >= 5) break;
328 std::cout << " " << sc.first << ": " << sc.second << std::endl;
329 }
330 std::cout << std::endl;
331
332 // Transaction amount stats
333 std::vector<double> amounts;
334 for (const auto& t : transactions) {
335 try {
336 amounts.push_back(std::stod(t.amount));
337 } catch (...) {
338 // Skip invalid amounts
339 }
340 }
341
342 if (!amounts.empty()) {
343 double totalAmount = std::accumulate(amounts.begin(), amounts.end(), 0.0);
344 double largest = *std::max_element(amounts.begin(), amounts.end());
345 double smallest = *std::min_element(amounts.begin(), amounts.end());
346
347 std::cout << "Transaction Amount Stats:" << std::endl;
348 std::cout << " Total: $" << std::fixed << std::setprecision(2) << totalAmount << std::endl;
349 std::cout << " Largest: $" << std::fixed << std::setprecision(2) << largest << std::endl;
350 std::cout << " Smallest: $" << std::fixed << std::setprecision(2) << smallest << std::endl;
351 }
352}