Merge pull request #2306 from mempool/nymkappa/bugfix/stats-import
Refactor LN stats import
This commit is contained in:
		
						commit
						50d99634f7
					
				
							
								
								
									
										34
									
								
								backend/package-lock.json
									
									
									
										generated
									
									
									
								
							
							
						
						
									
										34
									
								
								backend/package-lock.json
									
									
									
										generated
									
									
									
								
							| @ -16,7 +16,6 @@ | |||||||
|         "bitcoinjs-lib": "6.0.2", |         "bitcoinjs-lib": "6.0.2", | ||||||
|         "crypto-js": "^4.0.0", |         "crypto-js": "^4.0.0", | ||||||
|         "express": "^4.18.0", |         "express": "^4.18.0", | ||||||
|         "fast-xml-parser": "^4.0.9", |  | ||||||
|         "maxmind": "^4.3.6", |         "maxmind": "^4.3.6", | ||||||
|         "mysql2": "2.3.3", |         "mysql2": "2.3.3", | ||||||
|         "node-worker-threads-pool": "^1.5.1", |         "node-worker-threads-pool": "^1.5.1", | ||||||
| @ -3136,21 +3135,6 @@ | |||||||
|       "integrity": "sha512-DCXu6Ifhqcks7TZKY3Hxp3y6qphY5SJZmrWMDrKcERSOXWQdMhU9Ig/PYrzyw/ul9jOIyh0N4M0tbC5hodg8dw==", |       "integrity": "sha512-DCXu6Ifhqcks7TZKY3Hxp3y6qphY5SJZmrWMDrKcERSOXWQdMhU9Ig/PYrzyw/ul9jOIyh0N4M0tbC5hodg8dw==", | ||||||
|       "dev": true |       "dev": true | ||||||
|     }, |     }, | ||||||
|     "node_modules/fast-xml-parser": { |  | ||||||
|       "version": "4.0.9", |  | ||||||
|       "resolved": "https://registry.npmjs.org/fast-xml-parser/-/fast-xml-parser-4.0.9.tgz", |  | ||||||
|       "integrity": "sha512-4G8EzDg2Nb1Qurs3f7BpFV4+jpMVsdgLVuG1Uv8O2OHJfVCg7gcA53obuKbmVqzd4Y7YXVBK05oJG7hzGIdyzg==", |  | ||||||
|       "dependencies": { |  | ||||||
|         "strnum": "^1.0.5" |  | ||||||
|       }, |  | ||||||
|       "bin": { |  | ||||||
|         "fxparser": "src/cli/cli.js" |  | ||||||
|       }, |  | ||||||
|       "funding": { |  | ||||||
|         "type": "paypal", |  | ||||||
|         "url": "https://paypal.me/naturalintelligence" |  | ||||||
|       } |  | ||||||
|     }, |  | ||||||
|     "node_modules/fastq": { |     "node_modules/fastq": { | ||||||
|       "version": "1.13.0", |       "version": "1.13.0", | ||||||
|       "resolved": "https://registry.npmjs.org/fastq/-/fastq-1.13.0.tgz", |       "resolved": "https://registry.npmjs.org/fastq/-/fastq-1.13.0.tgz", | ||||||
| @ -5636,11 +5620,6 @@ | |||||||
|         "url": "https://github.com/sponsors/sindresorhus" |         "url": "https://github.com/sponsors/sindresorhus" | ||||||
|       } |       } | ||||||
|     }, |     }, | ||||||
|     "node_modules/strnum": { |  | ||||||
|       "version": "1.0.5", |  | ||||||
|       "resolved": "https://registry.npmjs.org/strnum/-/strnum-1.0.5.tgz", |  | ||||||
|       "integrity": "sha512-J8bbNyKKXl5qYcR36TIO8W3mVGVHrmmxsd5PAItGkmyzwJvybiw2IVq5nqd0i4LSNSkB/sx9VHllbfFdr9k1JA==" |  | ||||||
|     }, |  | ||||||
|     "node_modules/supports-color": { |     "node_modules/supports-color": { | ||||||
|       "version": "7.2.0", |       "version": "7.2.0", | ||||||
|       "resolved": "https://registry.npmjs.org/supports-color/-/supports-color-7.2.0.tgz", |       "resolved": "https://registry.npmjs.org/supports-color/-/supports-color-7.2.0.tgz", | ||||||
| @ -8556,14 +8535,6 @@ | |||||||
|       "integrity": "sha512-DCXu6Ifhqcks7TZKY3Hxp3y6qphY5SJZmrWMDrKcERSOXWQdMhU9Ig/PYrzyw/ul9jOIyh0N4M0tbC5hodg8dw==", |       "integrity": "sha512-DCXu6Ifhqcks7TZKY3Hxp3y6qphY5SJZmrWMDrKcERSOXWQdMhU9Ig/PYrzyw/ul9jOIyh0N4M0tbC5hodg8dw==", | ||||||
|       "dev": true |       "dev": true | ||||||
|     }, |     }, | ||||||
|     "fast-xml-parser": { |  | ||||||
|       "version": "4.0.9", |  | ||||||
|       "resolved": "https://registry.npmjs.org/fast-xml-parser/-/fast-xml-parser-4.0.9.tgz", |  | ||||||
|       "integrity": "sha512-4G8EzDg2Nb1Qurs3f7BpFV4+jpMVsdgLVuG1Uv8O2OHJfVCg7gcA53obuKbmVqzd4Y7YXVBK05oJG7hzGIdyzg==", |  | ||||||
|       "requires": { |  | ||||||
|         "strnum": "^1.0.5" |  | ||||||
|       } |  | ||||||
|     }, |  | ||||||
|     "fastq": { |     "fastq": { | ||||||
|       "version": "1.13.0", |       "version": "1.13.0", | ||||||
|       "resolved": "https://registry.npmjs.org/fastq/-/fastq-1.13.0.tgz", |       "resolved": "https://registry.npmjs.org/fastq/-/fastq-1.13.0.tgz", | ||||||
| @ -10398,11 +10369,6 @@ | |||||||
|       "integrity": "sha512-6fPc+R4ihwqP6N/aIv2f1gMH8lOVtWQHoqC4yK6oSDVVocumAsfCqjkXnqiYMhmMwS/mEHLp7Vehlt3ql6lEig==", |       "integrity": "sha512-6fPc+R4ihwqP6N/aIv2f1gMH8lOVtWQHoqC4yK6oSDVVocumAsfCqjkXnqiYMhmMwS/mEHLp7Vehlt3ql6lEig==", | ||||||
|       "dev": true |       "dev": true | ||||||
|     }, |     }, | ||||||
|     "strnum": { |  | ||||||
|       "version": "1.0.5", |  | ||||||
|       "resolved": "https://registry.npmjs.org/strnum/-/strnum-1.0.5.tgz", |  | ||||||
|       "integrity": "sha512-J8bbNyKKXl5qYcR36TIO8W3mVGVHrmmxsd5PAItGkmyzwJvybiw2IVq5nqd0i4LSNSkB/sx9VHllbfFdr9k1JA==" |  | ||||||
|     }, |  | ||||||
|     "supports-color": { |     "supports-color": { | ||||||
|       "version": "7.2.0", |       "version": "7.2.0", | ||||||
|       "resolved": "https://registry.npmjs.org/supports-color/-/supports-color-7.2.0.tgz", |       "resolved": "https://registry.npmjs.org/supports-color/-/supports-color-7.2.0.tgz", | ||||||
|  | |||||||
| @ -38,7 +38,6 @@ | |||||||
|     "bitcoinjs-lib": "6.0.2", |     "bitcoinjs-lib": "6.0.2", | ||||||
|     "crypto-js": "^4.0.0", |     "crypto-js": "^4.0.0", | ||||||
|     "express": "^4.18.0", |     "express": "^4.18.0", | ||||||
|     "fast-xml-parser": "^4.0.9", |  | ||||||
|     "maxmind": "^4.3.6", |     "maxmind": "^4.3.6", | ||||||
|     "mysql2": "2.3.3", |     "mysql2": "2.3.3", | ||||||
|     "node-worker-threads-pool": "^1.5.1", |     "node-worker-threads-pool": "^1.5.1", | ||||||
|  | |||||||
| @ -1,6 +1,5 @@ | |||||||
| import DB from '../../../database'; | import DB from '../../../database'; | ||||||
| import { promises } from 'fs'; | import { promises } from 'fs'; | ||||||
| import { XMLParser } from 'fast-xml-parser'; |  | ||||||
| import logger from '../../../logger'; | import logger from '../../../logger'; | ||||||
| import fundingTxFetcher from './funding-tx-fetcher'; | import fundingTxFetcher from './funding-tx-fetcher'; | ||||||
| import config from '../../../config'; | import config from '../../../config'; | ||||||
| @ -35,11 +34,8 @@ interface Channel { | |||||||
| 
 | 
 | ||||||
| class LightningStatsImporter { | class LightningStatsImporter { | ||||||
|   topologiesFolder = config.LIGHTNING.TOPOLOGY_FOLDER; |   topologiesFolder = config.LIGHTNING.TOPOLOGY_FOLDER; | ||||||
|   parser = new XMLParser(); |  | ||||||
| 
 | 
 | ||||||
|   async $run(): Promise<void> { |   async $run(): Promise<void> { | ||||||
|     logger.info(`Importing historical lightning stats`); |  | ||||||
| 
 |  | ||||||
|     const [channels]: any[] = await DB.query('SELECT short_id from channels;'); |     const [channels]: any[] = await DB.query('SELECT short_id from channels;'); | ||||||
|     logger.info('Caching funding txs for currently existing channels'); |     logger.info('Caching funding txs for currently existing channels'); | ||||||
|     await fundingTxFetcher.$fetchChannelsFundingTxs(channels.map(channel => channel.short_id)); |     await fundingTxFetcher.$fetchChannelsFundingTxs(channels.map(channel => channel.short_id)); | ||||||
| @ -63,6 +59,9 @@ class LightningStatsImporter { | |||||||
|       let isUnnanounced = true; |       let isUnnanounced = true; | ||||||
| 
 | 
 | ||||||
|       for (const socket of (node.addresses ?? [])) { |       for (const socket of (node.addresses ?? [])) { | ||||||
|  |         if (!socket.network?.length || !socket.addr?.length) { | ||||||
|  |           continue; | ||||||
|  |         } | ||||||
|         hasOnion = hasOnion || ['torv2', 'torv3'].includes(socket.network) || socket.addr.indexOf('onion') !== -1; |         hasOnion = hasOnion || ['torv2', 'torv3'].includes(socket.network) || socket.addr.indexOf('onion') !== -1; | ||||||
|         hasClearnet = hasClearnet || ['ipv4', 'ipv6'].includes(socket.network) || [4, 6].includes(isIP(socket.addr.split(':')[0])); |         hasClearnet = hasClearnet || ['ipv4', 'ipv6'].includes(socket.network) || [4, 6].includes(isIP(socket.addr.split(':')[0])); | ||||||
|       } |       } | ||||||
| @ -263,8 +262,6 @@ class LightningStatsImporter { | |||||||
|    * Import topology files LN historical data into the database |    * Import topology files LN historical data into the database | ||||||
|    */ |    */ | ||||||
|   async $importHistoricalLightningStats(): Promise<void> { |   async $importHistoricalLightningStats(): Promise<void> { | ||||||
|     let latestNodeCount = 1; |  | ||||||
| 
 |  | ||||||
|     const fileList = await fsPromises.readdir(this.topologiesFolder); |     const fileList = await fsPromises.readdir(this.topologiesFolder); | ||||||
|     // Insert history from the most recent to the oldest
 |     // Insert history from the most recent to the oldest
 | ||||||
|     // This also put the .json cached files first
 |     // This also put the .json cached files first
 | ||||||
| @ -282,55 +279,51 @@ class LightningStatsImporter { | |||||||
| 
 | 
 | ||||||
|     // For logging purpose
 |     // For logging purpose
 | ||||||
|     let processed = 10; |     let processed = 10; | ||||||
|     let totalProcessed = -1; |     let totalProcessed = 0; | ||||||
|  |     let logStarted = false; | ||||||
| 
 | 
 | ||||||
|     for (const filename of fileList) { |     for (const filename of fileList) { | ||||||
|       processed++; |       processed++; | ||||||
|       totalProcessed++; |  | ||||||
| 
 | 
 | ||||||
|       const timestamp = parseInt(filename.split('_')[1], 10); |       const timestamp = parseInt(filename.split('_')[1], 10); | ||||||
| 
 | 
 | ||||||
|       // Stats exist already, don't calculate/insert them
 |       // Stats exist already, don't calculate/insert them
 | ||||||
|       if (existingStatsTimestamps[timestamp] !== undefined) { |       if (existingStatsTimestamps[timestamp] !== undefined) { | ||||||
|         latestNodeCount = existingStatsTimestamps[timestamp].node_count; |         continue; | ||||||
|  |       } | ||||||
|  | 
 | ||||||
|  |       if (filename.indexOf('.topology') === -1) { | ||||||
|         continue; |         continue; | ||||||
|       } |       } | ||||||
| 
 | 
 | ||||||
|       logger.debug(`Reading ${this.topologiesFolder}/${filename}`); |       logger.debug(`Reading ${this.topologiesFolder}/${filename}`); | ||||||
|       const fileContent = await fsPromises.readFile(`${this.topologiesFolder}/${filename}`, 'utf8'); |       let fileContent = ''; | ||||||
|  |       try { | ||||||
|  |         fileContent = await fsPromises.readFile(`${this.topologiesFolder}/${filename}`, 'utf8'); | ||||||
|  |       } catch (e: any) { | ||||||
|  |         if (e.errno == -1) { // EISDIR - Ignore directorie
 | ||||||
|  |           continue; | ||||||
|  |         } | ||||||
|  |       } | ||||||
| 
 | 
 | ||||||
|       let graph; |       let graph; | ||||||
|       if (filename.indexOf('.json') !== -1) { |       try { | ||||||
|         try { |         graph = JSON.parse(fileContent); | ||||||
|           graph = JSON.parse(fileContent); |       } catch (e) { | ||||||
|         } catch (e) { |         logger.debug(`Invalid topology file ${this.topologiesFolder}/${filename}, cannot parse the content`); | ||||||
|           logger.debug(`Invalid topology file ${this.topologiesFolder}/${filename}, cannot parse the content`); |         continue; | ||||||
|           continue; |  | ||||||
|         } |  | ||||||
|       } else { |  | ||||||
|         graph = this.parseFile(fileContent); |  | ||||||
|         if (!graph) { |  | ||||||
|           logger.debug(`Invalid topology file ${this.topologiesFolder}/${filename}, cannot parse the content`); |  | ||||||
|           continue; |  | ||||||
|         } |  | ||||||
|         await fsPromises.writeFile(`${this.topologiesFolder}/${filename}.json`, JSON.stringify(graph)); |  | ||||||
|       } |       } | ||||||
| 
 |    | ||||||
|       if (timestamp > 1556316000) { |       if (!logStarted) { | ||||||
|         // "No, the reason most likely is just that I started collection in 2019,
 |         logger.info(`Founds a topology file that we did not import. Importing historical lightning stats now.`); | ||||||
|         // so what I had before that is just the survivors from before, which weren't that many"
 |         logStarted = true; | ||||||
|         const diffRatio = graph.nodes.length / latestNodeCount; |  | ||||||
|         if (diffRatio < 0.9) { |  | ||||||
|           // Ignore drop of more than 90% of the node count as it's probably a missing data point
 |  | ||||||
|           logger.debug(`Nodes count diff ratio threshold reached, ignore the data for this day ${graph.nodes.length} nodes vs ${latestNodeCount}`); |  | ||||||
|           continue; |  | ||||||
|         } |  | ||||||
|       } |       } | ||||||
|       latestNodeCount = graph.nodes.length; |        | ||||||
| 
 |  | ||||||
|       const datestr = `${new Date(timestamp * 1000).toUTCString()} (${timestamp})`; |       const datestr = `${new Date(timestamp * 1000).toUTCString()} (${timestamp})`; | ||||||
|       logger.debug(`${datestr}: Found ${graph.nodes.length} nodes and ${graph.edges.length} channels`); |       logger.debug(`${datestr}: Found ${graph.nodes.length} nodes and ${graph.edges.length} channels`); | ||||||
| 
 | 
 | ||||||
|  |       totalProcessed++; | ||||||
|  | 
 | ||||||
|       if (processed > 10) { |       if (processed > 10) { | ||||||
|         logger.info(`Generating LN network stats for ${datestr}. Processed ${totalProcessed}/${fileList.length} files`); |         logger.info(`Generating LN network stats for ${datestr}. Processed ${totalProcessed}/${fileList.length} files`); | ||||||
|         processed = 0; |         processed = 0; | ||||||
| @ -343,76 +336,9 @@ class LightningStatsImporter { | |||||||
|       existingStatsTimestamps[timestamp] = stat; |       existingStatsTimestamps[timestamp] = stat; | ||||||
|     } |     } | ||||||
| 
 | 
 | ||||||
|     logger.info(`Lightning network stats historical import completed`); |     if (totalProcessed > 0) { | ||||||
|   } |       logger.info(`Lightning network stats historical import completed`); | ||||||
| 
 |  | ||||||
|   /** |  | ||||||
|    * Parse the file content into XML, and return a list of nodes and channels |  | ||||||
|    */ |  | ||||||
|   private parseFile(fileContent): any { |  | ||||||
|     const graph = this.parser.parse(fileContent); |  | ||||||
|     if (Object.keys(graph).length === 0) { |  | ||||||
|       return null; |  | ||||||
|     } |     } | ||||||
| 
 |  | ||||||
|     const nodes: Node[] = []; |  | ||||||
|     const channels: Channel[] = []; |  | ||||||
| 
 |  | ||||||
|     // If there is only one entry, the parser does not return an array, so we override this
 |  | ||||||
|     if (!Array.isArray(graph.graphml.graph.node)) { |  | ||||||
|       graph.graphml.graph.node = [graph.graphml.graph.node]; |  | ||||||
|     } |  | ||||||
|     if (!Array.isArray(graph.graphml.graph.edge)) { |  | ||||||
|       graph.graphml.graph.edge = [graph.graphml.graph.edge]; |  | ||||||
|     } |  | ||||||
| 
 |  | ||||||
|     for (const node of graph.graphml.graph.node) { |  | ||||||
|       if (!node.data) { |  | ||||||
|         continue; |  | ||||||
|       } |  | ||||||
|       const addresses: unknown[] = []; |  | ||||||
|       const sockets = node.data[5].split(','); |  | ||||||
|       for (const socket of sockets) { |  | ||||||
|         const parts = socket.split('://'); |  | ||||||
|         addresses.push({ |  | ||||||
|           network: parts[0], |  | ||||||
|           addr: parts[1], |  | ||||||
|         }); |  | ||||||
|       } |  | ||||||
|       nodes.push({ |  | ||||||
|         id: node.data[0], |  | ||||||
|         timestamp: node.data[1], |  | ||||||
|         features: node.data[2], |  | ||||||
|         rgb_color: node.data[3], |  | ||||||
|         alias: node.data[4], |  | ||||||
|         addresses: addresses, |  | ||||||
|         out_degree: node.data[6], |  | ||||||
|         in_degree: node.data[7], |  | ||||||
|       }); |  | ||||||
|     } |  | ||||||
| 
 |  | ||||||
|     for (const channel of graph.graphml.graph.edge) { |  | ||||||
|       if (!channel.data) { |  | ||||||
|         continue; |  | ||||||
|       } |  | ||||||
|       channels.push({ |  | ||||||
|         channel_id: channel.data[0], |  | ||||||
|         node1_pub: channel.data[1], |  | ||||||
|         node2_pub: channel.data[2], |  | ||||||
|         timestamp: channel.data[3], |  | ||||||
|         features: channel.data[4], |  | ||||||
|         fee_base_msat: channel.data[5], |  | ||||||
|         fee_rate_milli_msat: channel.data[6], |  | ||||||
|         htlc_minimim_msat: channel.data[7], |  | ||||||
|         cltv_expiry_delta: channel.data[8], |  | ||||||
|         htlc_maximum_msat: channel.data[9], |  | ||||||
|       }); |  | ||||||
|     } |  | ||||||
| 
 |  | ||||||
|     return { |  | ||||||
|       nodes: nodes, |  | ||||||
|       edges: channels, |  | ||||||
|     }; |  | ||||||
|   } |   } | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
|  | |||||||
		Loading…
	
	
			
			x
			
			
		
	
		Reference in New Issue
	
	Block a user