import sys

def install_packages():
    """Make ``relationalai`` and ``matplotlib`` available to this script.

    When the ``snowbook`` module is loaded (taken as the sign of running
    inside a Snowflake notebook), ``./relationalai.zip`` is put on
    ``sys.path`` and the user is reminded to add matplotlib through the
    package dropdown. Otherwise both packages are installed with pip.
    """
    in_snowflake_notebook = "snowbook" in sys.modules
    if in_snowflake_notebook:
        zip_path = "./relationalai.zip"
        # Re-running this cell must not pile up duplicate path entries.
        if zip_path not in sys.path:
            sys.path.append(zip_path)
        print("Install matplotlib from package dropdown.")
    else:
        import subprocess

        # Invoke pip through the running interpreter so the packages land in
        # the environment this script actually uses, and pass an argument
        # list rather than a shell command string.
        completed = subprocess.run(
            [sys.executable, "-m", "pip", "install", "relationalai", "matplotlib"],
            check=False,
        )
        if completed.returncode != 0:
            # Stay best-effort (the packages may already be installed), but
            # do not hide the failure the way os.system did.
            print(
                f"pip install exited with status {completed.returncode}.",
                file=sys.stderr,
            )

# Runs before the relationalai / matplotlib imports that follow, so the
# packages are in place by the time they are imported.
install_packages()

import relationalai as rai
from relationalai.std.graphs import Graph
from relationalai import std
from relationalai.std import alias
from relationalai.std.aggregates import count, sum, max, top

import matplotlib as mpl
from typing import Tuple

# Provider handle; used below to run SQL and to create the data stream.
provider = rai.Provider()

# Set up the demo data: create the RAI_DEMO database and MONEY_FLOW schema if
# they are missing, (re)create the USER_TRANSACTIONS table, and load the
# sample rows. Each row is (USER1_ID, USER2_ID, AMOUNT). Because the table is
# created with "create or replace", re-running this statement starts from an
# empty table before inserting.
provider.sql("""
create database if not exists RAI_DEMO;
create schema if not exists RAI_DEMO.MONEY_FLOW;

create or replace table RAI_DEMO.MONEY_FLOW.USER_TRANSACTIONS (
	USER1_ID NUMBER(18,0),
	USER2_ID NUMBER(18,0),
	AMOUNT NUMBER(18,0)
);

insert into RAI_DEMO.MONEY_FLOW.USER_TRANSACTIONS (USER1_ID, USER2_ID, AMOUNT) VALUES
(1,2,1766),
(1,2,338),
(1,2,504),
(1,2,504),
(1,3,4202),
(1,4,693),
(2,5,828),
(1,6,772),
(13,10,806),
(9,6,241),
(12,17,738),
(16,9,415),
(5,1,1086),
(15,12,684),
(3,2,996),
(20,3,766),
(17,15,167),
(15,3,794),
(19,12,956),
(14,12,654),
(15,14,891),
(3,14,1668),
(1,4,916),
(18,7,142),
(20,9,212),
(6,9,781),
(13,2,828),
(4,3,646),
(4,8,794),
(15,17,191),
(9,2,276),
(18,16,651),
(20,2,306),
(6,5,195),
(20,11,536),
(8,15,327),
(15,19,772),
(4,18,782),
(3,2,610),
(20,14,693),
(5,16,338);
""")

# Create a stream for the USER_TRANSACTIONS table. The second argument is
# "money_trail", the same name the model is created with further down
# (presumably this is what ties the stream to that model; confirm against the
# relationalai docs).
provider.create_streams(
    ["RAI_DEMO.MONEY_FLOW.USER_TRANSACTIONS"],
    "money_trail",
)

# Model that every type, rule and query in this script is attached to.
model = rai.Model("money_trail")

# Transaction entities come from the Snowflake table given as `source`.
Transaction = model.Type("Transaction", source="rai_demo.money_flow.user_transactions")

# Ask the type which properties it knows about.
Transaction.known_properties()

# NOTE(review): the list below looks like the pasted output of the call above.
# As a statement it is an expression with no effect.
['snowflake_id', 'amount', 'user2_id', 'user1_id']

# Count the transactions and label the result column 'nr. transactions'.
with model.query() as select:
    t = Transaction()
    response = select(alias(count(t), 'nr. transactions'))
# Bare expression: presumably left as the last line of a notebook cell so the
# result is displayed.
response

# Show the sender id, receiver id and amount of 5 transactions, picked with
# top(5, t).
with model.query() as select:
    t = Transaction()
    top(5, t)
    response = select(t.user1_id, t.user2_id, t.amount)
response

# Users are not loaded from a table; they are derived from the ids that
# appear in transactions.
User = model.Type("User")

# For every transaction, add a User for user1_id and one for user2_id and link
# them to the transaction as `src` and `dst` respectively.
with model.rule():
    t = Transaction()
    t.set(src = User.add(id=t.user1_id),
          dst = User.add(id=t.user2_id))

# Graph of the raw input: users as nodes, one edge per (src, dst) transaction.
input_graph = Graph(model)
# NOTE: Node and Edge are rebound each time a new graph is built later in the
# script, so they always refer to the most recently created graph.
Node, Edge = input_graph.Node, input_graph.Edge

# Every User is a node; the user id is used for both the label and the hover text.
Node.extend(User, label=User.id, hover=User.id)

with model.rule():
    t = Transaction()
    Edge.add(t.src, t.dst)

input_graph.visualize().display(inline=True)

# txn_received: number of transactions in which the user is the destination.
with model.rule():
    u = User()
    t = Transaction(dst = u)
    u.set(txn_received = count(t, per = [t.dst]))

# txn_sent: number of transactions in which the user is the source.
with model.rule():
    u = User()
    t = Transaction(src = u)
    u.set(txn_sent = count(t, per = [t.src]))

# total_txn_count: sent plus received. or_(0) is used so that a user lacking
# one of the two counts still gets a total (presumably it substitutes 0 for a
# missing value).
with model.rule():
    u = User()
    u.set(total_txn_count = u.txn_sent.or_(0) + u.txn_received.or_(0))

# Show id, sent count and received count for 10 users selected with
# top(10, u.txn_received, u).
with model.query() as select:
    u = User()
    top(10, u.txn_received, u)
    result = select(u.id, u.txn_sent.or_(0), u.txn_received.or_(0))
result

# total_received: number of transactions that share this transaction's
# (dst, src) pair. The value is stored on each transaction of the pair.
with model.rule():
    t = Transaction()
    t.set(total_received = count(t, per=[t.dst, t.src]))

# Show receiver, sender and pair count for 10 transactions selected with
# top(10, t.total_received, t). Rows are per transaction, so a pair with
# several transactions can appear more than once.
with model.query() as select:
    t = Transaction()
    top(10, t.total_received, t)
    result = select(alias(t.dst.id, 'receiver'), alias(t.src.id, 'sender'), t.total_received)
result

# A StrongConnection is a transaction whose (dst, src) pair has more than one
# transaction between them.
StrongConnection = model.Type("StrongConnection")

with model.rule():
    t = Transaction()
    # Bare comparison: acts as the filter for the rule body that follows.
    t.total_received > 1
    t.set(StrongConnection)

# Graph of users connected by transactions, annotated with how many
# transactions each (src, dst) pair has.
txn_ct_graph = Graph(model, weighted=True)
Node, Edge = txn_ct_graph.Node, txn_ct_graph.Edge

Node.extend(User, label=User.id)

# Strong connections should stand out, so their edges get both a color and a size.
with model.rule():
    t = Transaction()
    sc = StrongConnection()
    Edge.add(t.src, t.dst, hover=t.total_received)
    # The size must come from the strong connection itself. `t` and `sc` are
    # independent variables in this rule, so sizing by `t.total_received`
    # would feed the counts of unrelated transactions into every red edge.
    Edge.add(sc.src, sc.dst, color = 'red', size=sc.total_received * 3)

txn_ct_graph.visualize().display(inline=True)

# NOTE: `sum` here is relationalai.std.aggregates.sum (imported at the top of
# the file), not the Python builtin. It sums over the distinct tuples of its
# arguments, so the transaction `t` is passed along with `t.amount`: otherwise
# two transactions with the same amount in the same group (such as the two
# 1 -> 2 transfers of 504 in the sample data) would be counted only once.

# total_volume: total amount moved from t.src to t.dst, stored on every
# transaction of that pair.
with model.rule():
    t = Transaction()
    t.set(total_volume = sum(t, t.amount, per=[t.src, t.dst]))

# total_amt_received: total amount of all transactions sent to the user.
with model.rule():
    u = User()
    t = Transaction(dst = u)
    u.set(total_amt_received = sum(t, t.amount, per=[t.dst]))

# total_amt_sent: total amount of all transactions sent by the user.
with model.rule():
    u = User()
    t = Transaction(src = u)
    u.set(total_amt_sent = sum(t, t.amount, per=[t.src]))

# Net amount per user: total sent minus total received, with or_(0) covering
# users that only sent or only received. top(10, -diff, u) ranks on the
# negated difference, i.e. it favors users who received more than they sent.
with model.query() as select:
    u = User()
    tr = u.total_amt_received.or_(0)
    ts = u.total_amt_sent.or_(0)
    diff = ts - tr
    top(10, -diff, u)
    result = select(u.id, alias(ts, 'total amount sent'), alias(tr, 'total amt received'), alias(diff, 'net amount'))
result

# Directed graph of users in which edge thickness reflects transaction volume.
tv_graph = Graph(model, weighted=True, undirected=False)
Node, Edge = tv_graph.Node, tv_graph.Edge

Node.extend(User, label=User.id)

# Each edge is sized by the pair's total volume divided by 300 and shows the
# unscaled volume on hover; edges of strong connections are also colored red.
with model.rule():
    t = Transaction()
    sc = StrongConnection()
    Edge.add(t.src, t.dst, size=t.total_volume/300, hover=t.total_volume)
    Edge.add(sc.src, sc.dst, color = 'red')

tv_graph.visualize().display(inline=True)

# Graph used for community detection with Infomap.
infomap_graph = Graph(model)
Node, Edge = infomap_graph.Node, infomap_graph.Edge

Node.extend(User, label=User.id)

# Each edge is sized by the pair's total volume divided by 300 and shows the
# unscaled volume on hover.
with model.rule():
    t = Transaction()
    Edge.add(t.src, t.dst, size=t.total_volume/300, hover=t.total_volume)

# Store the Infomap result for each user both on the User entity and on the
# corresponding graph node.
with model.rule():
    u = User()
    community = infomap_graph.compute.infomap(u)
    u.set(community = community)
    Node(u).set(community = community)

# Number of users in each community; select.distinct yields one row per
# (community, count) combination.
with model.query() as select:
    u = User()
    c = count(u, per=[u.community])
    result = select.distinct(u.community, alias(c, 'user count'))

result

def color_nodes(graph, by: str, cmap = mpl.cm.rainbow, default: str = "black"):
    """Build a node-color callback driven by the node property named ``by``.

    A rule is added to ``graph.model`` that min-max scales the ``by``
    property across the graph's nodes and stores the scaled value as each
    node's ``color`` property. The returned function takes a node (accessed
    with ``.get("color")`` and ``["color"]``) and returns the hex string for
    ``cmap`` applied to that stored value, or ``default`` when the node has
    no ``color`` value.
    """
    with graph.model.rule():
        n = graph.Node()
        value = getattr(n, by)
        lowest = std.aggregates.min(value)
        highest = std.aggregates.max(value)
        # Scale to the range spanned by the smallest and largest value.
        offset = value - lowest
        span = highest - lowest
        n.set(color=offset / span)

    def _color(node):
        # Guard first: a node without a `color` value gets the fallback color.
        if node.get("color") is None:
            return default
        return mpl.colors.to_hex(cmap(node["color"]))

    return _color

# Draw the Infomap graph with each node colored by its `community` property.
infomap_graph.visualize(node_size_factor = 2, style={"node": {"color": color_nodes(infomap_graph, by="community") }}).display(inline=True)

# Undirected, weighted graph used to score users by eigenvector centrality.
weighted_tv_graph = Graph(model, undirected=True, weighted=True)
Node, Edge = weighted_tv_graph.Node, weighted_tv_graph.Edge

# The edge weight between two users is the transaction volume between them,
# combining both directions when money flowed both ways.
with model.rule():
    t = Transaction()
    # Case 1: no transaction exists in the opposite direction, so the weight
    # is this direction's total volume.
    with model.case():
        with model.not_found():
            Transaction(src=t.dst, dst=t.src)
        Edge.add(t.src, t.dst, weight=t.total_volume, size=t.total_volume/1000, hover=t.total_volume)
    # Case 2: a reverse transaction exists, so both directions' totals are added.
    with model.case():
        total_volume = t.total_volume + Transaction(src=t.dst, dst=t.src).total_volume
        Edge.add(t.src, t.dst, weight=total_volume, size=total_volume/1000, hover=total_volume)

# Nodes carry the user's id as label, the centrality score (set by the rule
# below) as hover text, and the user's `community` property.
with model.rule():
    u = User()
    Node.add(u, label=u.id, hover = u.ctr_by_tv,  community=u.community)

with model.rule():
    u = User()
    ctr_by_tv = weighted_tv_graph.compute.eigenvector_centrality(u)
    # Store the centrality on the node (and size the node by it, scaled by
    # 200) as well as on the User entity.
    Node(u).set(ctr_by_tv=ctr_by_tv, size=ctr_by_tv*200)
    u.set(ctr_by_tv=ctr_by_tv)

# Show id and centrality score for 10 users selected with top(10, u.ctr_by_tv, u).
with model.query() as select:
    u = User()
    top(10, u.ctr_by_tv, u)
    result = select(alias(u.id, "user"), alias(u.ctr_by_tv, "eigenvector score by txn volume"))
result

# Draw the graph with each node colored by its `community` property.
weighted_tv_graph.visualize(node_size_factor = 0.75, style={"node": {"color": color_nodes(weighted_tv_graph, by="community") }}).display(inline=True)

# A HighScoringUser is a user whose centrality score equals the highest score
# within their community.
HighScoringUser = model.Type('HighScoringUser')

with model.rule():
    u = User()
    # `max` is relationalai.std.aggregates.max (imported at the top of the
    # file), not the Python builtin.
    max_score = max(u.ctr_by_tv, per=[u.community])
    # Bare comparison: acts as the filter for the rule body that follows.
    u.ctr_by_tv == max_score
    u.set(HighScoringUser)


# List each high-scoring user with their community and centrality score.
with model.query() as select:
    u = HighScoringUser()
    result = select(u.community,alias(u.id, "user"), alias(u.ctr_by_tv, "eigenvector score by txn volume"))
result

@model.export("rai_demo.money_flow")
def get_high_scoring_users() -> Tuple[int]:
    """Return the ids of the ``HighScoringUser`` entities.

    Registered through ``model.export`` with the target
    ``rai_demo.money_flow``.
    """
    return HighScoringUser().id

user	eigenvector score by txn volume
1	0.609837
2	0.410369
3	0.572984
4	0.210352
5	0.154048
6	0.080669
13	0.051982
14	0.171205
15	0.098477
20	0.104724

Understanding Customer Behavior using Knowledge Graphs

Let's get started!

Importing Packages

Importing data from Snowflake

Getting to know the input data

Weaving data into the model

Visualizing the input data

Enriching the graph with additional knowledge

Knowledge gained by counting transactions

Visualizing Strong Connections

Identifying the most valuable relationships using the `sum` aggregation

Community Detection using Infomap

Detecting influential users

Detecting influential users based on transaction volume

Extending visualization with eigenvector score

Selecting Users for Targeted Campaigns

Create stored procedure

id	total amount sent	total amt received	net amount
2	828	5624	-4796
3	3274	6408	-3134
8	327	794	-467
9	517	1408	-891
10	0	806	-806
11	0	536	-536
12	738	2294	-1556
14	654	3252	-2598
16	415	989	-574
17	167	929	-762

user1_id	user2_id	amount
5	1	1086
5	16	338
20	3	766
20	9	212
20	14	693

id	txn_sent	txn_received
2	1	9
3	3	4
4	3	2
6	2	2
9	2	3
12	1	3
14	1	3
15	5	2
16	1	2
17	1	2

receiver	sender	total_received
1	5	1
2	1	4
2	1	4
2	1	4
2	1	4
2	3	2
2	3	2
3	20	1
4	1	2
4	1	2

Understanding Customer Behavior using Knowledge Graphs

Let's get started!

Importing Packages

Importing data from Snowflake

Getting to know the input data

Weaving data into the model

Visualizing the input data

Enriching the graph with additional knowledge

Knowledge gained by counting transactions

Visualizing Strong Connections

Identifying the most valuable relationships using the sum aggregation

Community Detection using Infomap

Detecting influential users

Detecting influential users based on transaction volume

Extending visualization with eigenvector score

Selecting Users for Targeted Campaigns

Create stored procedure

Identifying the most valuable relationships using the `sum` aggregation