Skip to content

Commit 7d12ce0

Browse files
Add ZINC datasets
1 parent 9757c50 commit 7d12ce0

File tree

1 file changed

+111
-1
lines changed

1 file changed

+111
-1
lines changed

src/TUDatasets.jl

Lines changed: 111 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -305,6 +305,11 @@ function __init__()
305305
PTC_FRDataset(),
306306
PTC_MMDataset(),
307307
PTC_MRDataset(),
308+
QM9Dataset(),
309+
ZINC_fullDataset(),
310+
ZINC_testDataset(),
311+
ZINC_trainDataset(),
312+
ZINC_valDataset(),
308313
DDDataset(),
309314
ENZYMESDataset(),
310315
PROTEINSDataset(),
@@ -320,7 +325,6 @@ function __init__()
320325
REDDIT_MULTI_5KDataset(),
321326
REDDIT_MULTI_12KDataset(),
322327
COLORS_3Dataset(),
323-
QM9Dataset(),
324328
SYNTHETICDataset(),
325329
SYNTHETICnewDataset(),
326330
SynthieDataset(),
@@ -639,6 +643,112 @@ edge_attributes_type(::QM9Dataset) = NTuple{4, Bool}
639643
graph_attributes_type(::QM9Dataset) = NamedTuple{(:μ, :α, :ϵ_HOMO, :ϵ_LUMO, :Δϵ, :electronic_spatial_energy,
640644
:ZPVE, :U_0, :U, :H, :G, :c_v, :UATOM_0, :UTAM, :HATOM, :GATOM, :A, :B, :C), NTuple{19, Float64}}
641645

646+
647+
## --------------------------------------
648+
## ZINC_full
649+
## --------------------------------------
650+
651+
struct ZINC_fullDataset <: TUDataset end
652+
653+
dataset_name(::ZINC_fullDataset) = "ZINC_full"
654+
655+
dataset_hash(::ZINC_fullDataset) = "b491cce62afbf5e0febab9ca0bacd0a2458910cefadfd3d93bb6c49b90d62b3c"
656+
657+
readme_name(::ZINC_fullDataset) = "README.txt"
658+
659+
dataset_references(::ZINC_fullDataset) = [31]
660+
661+
edge_labels_type(::ZINC_fullDataset) = @NamedTuple{bond_type::String}
662+
edge_labels_map(::ZINC_fullDataset, i) = ("single", "double", "triple")[i]
663+
664+
node_labels_type(::ZINC_fullDataset) = @NamedTuple{atom_type::String}
665+
node_labels_map(::ZINC_fullDataset, i) = ("C", "O", "N", "F", "C H1", "S", "Cl",
666+
"O -", "N H1 +", "Br", "N H3 +", "N H2 +",
667+
"N +", "N -", "S -", "I", "P", "O H1 +",
668+
"N H1 -", "O +", "S +", "P H1", "P H2", "C H2 -",
669+
"P +", "S H1 +", "C H1 -", "P H1 +")[i + 1]
670+
671+
graph_attributes_type(::ZINC_fullDataset) = Tuple{Float64}
672+
673+
## --------------------------------------
674+
## ZINC_test
675+
## --------------------------------------
676+
677+
struct ZINC_testDataset <: TUDataset end
678+
679+
dataset_name(::ZINC_testDataset) = "ZINC_test"
680+
681+
dataset_hash(::ZINC_testDataset) = "1fe8516fef763cf71238d19a12680ce5cb6a620bbf36134eca8045d6f3e0ed4d"
682+
683+
readme_name(::ZINC_testDataset) = "README.txt"
684+
685+
dataset_references(::ZINC_testDataset) = [31]
686+
687+
edge_labels_type(::ZINC_testDataset) = @NamedTuple{bond_type::String}
688+
edge_labels_map(::ZINC_testDataset, i) = ("single", "double", "triple")[i]
689+
690+
node_labels_type(::ZINC_testDataset) = @NamedTuple{atom_type::String}
691+
node_labels_map(::ZINC_testDataset, i) = ("C", "O", "N", "F", "C H1", "S", "Cl",
692+
"O -", "N H1 +", "Br", "N H3 +", "N H2 +",
693+
"N +", "N -", "S -", "I", "P", "O H1 +",
694+
"N H1 -", "O +", "S +", "P H1", "P H2", "C H2 -",
695+
"P +", "S H1 +", "C H1 -", "P H1 +")[i + 1]
696+
697+
graph_attributes_type(::ZINC_testDataset) = Tuple{Float64}
698+
699+
## --------------------------------------
700+
## ZINC_train
701+
## --------------------------------------
702+
703+
struct ZINC_trainDataset <: TUDataset end
704+
705+
dataset_name(::ZINC_trainDataset) = "ZINC_train"
706+
707+
# Expected hash of the ZINC_train download.
# This method must dispatch on ZINC_trainDataset: dispatching on ZINC_testDataset here
# would silently replace the ZINC_test hash method and leave ZINC_train without one.
dataset_hash(::ZINC_trainDataset) = "37aa44df9dd9417600c240226d1d847a7b9098c3036c9bf7e2000196cec92bef"
708+
709+
readme_name(::ZINC_trainDataset) = "README.txt"
710+
711+
dataset_references(::ZINC_trainDataset) = [31]
712+
713+
edge_labels_type(::ZINC_trainDataset) = @NamedTuple{bond_type::String}
714+
edge_labels_map(::ZINC_trainDataset, i) = ("single", "double", "triple")[i]
715+
716+
node_labels_type(::ZINC_trainDataset) = @NamedTuple{atom_type::String}
717+
node_labels_map(::ZINC_trainDataset, i) = ("C", "O", "N", "F", "C H1", "S", "Cl",
718+
"O -", "N H1 +", "Br", "N H3 +", "N H2 +",
719+
"N +", "N -", "S -", "I", "P", "O H1 +",
720+
"N H1 -", "O +", "S +", "P H1", "P H2", "C H2 -",
721+
"P +", "S H1 +", "C H1 -", "P H1 +")[i + 1]
722+
723+
graph_attributes_type(::ZINC_trainDataset) = Tuple{Float64}
724+
725+
## --------------------------------------
726+
## ZINC_val
727+
## --------------------------------------
728+
729+
struct ZINC_valDataset <: TUDataset end
730+
731+
dataset_name(::ZINC_valDataset) = "ZINC_val"
732+
733+
dataset_hash(::ZINC_valDataset) = "17b20a99822f17eca9cd6c3e5ac33f41fd42c0ee4dedfd051dac0b0a58f8fa88"
734+
735+
readme_name(::ZINC_valDataset) = "README.txt"
736+
737+
dataset_references(::ZINC_valDataset) = [31]
738+
739+
edge_labels_type(::ZINC_valDataset) = @NamedTuple{bond_type::String}
740+
edge_labels_map(::ZINC_valDataset, i) = ("single", "double", "triple")[i]
741+
742+
node_labels_type(::ZINC_valDataset) = @NamedTuple{atom_type::String}
743+
node_labels_map(::ZINC_valDataset, i) = ("C", "O", "N", "F", "C H1", "S", "Cl",
744+
"O -", "N H1 +", "Br", "N H3 +", "N H2 +",
745+
"N +", "N -", "S -", "I", "P", "O H1 +",
746+
"N H1 -", "O +", "S +", "P H1", "P H2", "C H2 -",
747+
"P +", "S H1 +", "C H1 -", "P H1 +")[i + 1]
748+
749+
graph_attributes_type(::ZINC_valDataset) = Tuple{Float64}
750+
751+
642752
## --------------------------------------
643753
## DD
644754
## --------------------------------------

0 commit comments

Comments
 (0)