@misc{706, keywords = {Blockchain Analytics, Decentralized Finance, Network Science, Data Mining, Distributed Ledger Technologies}, author = {Natkamon Tovanich and Rémy Cazabet and Célestin Coquidé}, title = {Needles in the Haystack : Decoding On-Chain Behavior with Network Science and Data Mining}, abstract = {

We apply network science methodologies to address analytical challenges in blockchain and Decentralized Finance (DeFi). The pseudonymous nature of Bitcoin and the complex, multi-token interactions of Ethereum-based protocols require tools that go beyond traditional blockchain analysis. We present three network-based frameworks for understanding actor behavior and financial activities in these decentralized systems. First, for Bitcoin, we introduce a money flow representation learning approach that encodes taint networks into graph embeddings to identify entities across multiple address clusters. Second, we analyze DeFi activity using ego network motif mining, which extracts recurring structures from token transfer networks. This method can infer transaction methods (e.g., deposits, swaps, borrowing) and characterizes user behavior, even when labels are incomplete or noisy. Third, we model multi-token interactions through a Multilayer Token Network that links cross-token flows. Using PageRank-CheiRank Trade Balance, we quantify accumulation versus dispersion strategies and uncover temporal shifts in trading behavior, illustrated through entities such as Alameda Research. Together, these frameworks show how network topology, motifs, and multilayer flows transform raw blockchain data into interpretable insights on identity, function, and financial strategy.

}, year = {2025}, journal = {Data Mining & Machine Learning (DM2L) Seminar at UMR5205 2025}, month = {12/2025}, address = {Villeurbanne}, doi = {10.34726/11799}, }