@@ -19,14 +19,14 @@ This one-time setup downloads ~120MB of data and prepares it for use.
1919Find entries across all datasets:
2020
2121``` bash
22- # Search for "give" in all datasets
23- glazing search query " give" --data-dir ~ /.local/share/glazing/converted
22+ # Search for "give" in all datasets (uses the default data directory)
23+ glazing search query " give"
2424
2525# Search only in VerbNet
26- glazing search query " give" --dataset verbnet --data-dir ~ /.local/share/glazing/converted
26+ glazing search query " give" --dataset verbnet
2727
2828# Get JSON output
29- glazing search query " give" --json --data-dir ~ /.local/share/glazing/converted
29+ glazing search query " give" --json
3030```
3131
3232### Find Cross-References
@@ -35,8 +35,7 @@ Discover connections between datasets:
3535
3636``` bash
3737# Find VerbNet classes for a PropBank roleset
38- glazing search cross-ref --source propbank --target verbnet --id " give.01" \
39- --data-dir ~ /.local/share/glazing/converted
38+ glazing search cross-ref --source propbank --target verbnet --id " give.01"
4039```
4140
4241### Get Dataset Information
@@ -57,13 +56,12 @@ glazing download info verbnet
5756
5857``` python
5958from glazing.search import UnifiedSearch
60- from pathlib import Path
6159
62- # Initialize search with default data directory
60+ # Initialize search (automatically uses default paths)
6361search = UnifiedSearch()
6462
6563# Search across all datasets
66- results = search.search_by_query (" abandon" )
64+ results = search.search (" abandon" )
6765
6866for result in results[:5 ]:
6967 print (f " { result.dataset} : { result.name} " )
@@ -77,32 +75,27 @@ for result in results[:5]:
7775``` python
7876from glazing.framenet.loader import FrameNetLoader
7977from glazing.verbnet.loader import VerbNetLoader
80- from pathlib import Path
8178
82- data_dir = Path.home() / " .local/share/glazing/converted"
83-
84- # Load FrameNet
85- fn_loader = FrameNetLoader()
86- frames = fn_loader.load_frames(data_dir / " framenet.jsonl" )
79+ # Once 'glazing init' has been run, loaders use the default paths and load their data automatically
80+ fn_loader = FrameNetLoader() # Data is already loaded
81+ frames = fn_loader.frames
8782print (f " Loaded { len (frames)} frames " )
8883
89- # Load VerbNet
90- vn_loader = VerbNetLoader()
91- verb_classes = vn_loader.load_verb_classes(data_dir / " verbnet.jsonl" )
84+ vn_loader = VerbNetLoader() # Data is already loaded
85+ verb_classes = list (vn_loader.classes.values())
9286print (f " Loaded { len (verb_classes)} verb classes " )
9387```
9488
9589### Work with VerbNet Classes
9690
9791``` python
9892from glazing.verbnet.loader import VerbNetLoader
99- from pathlib import Path
10093
101- data_dir = Path.home() / " .local/share/glazing/converted "
94+ # Loader automatically uses default path and loads data
10295loader = VerbNetLoader()
10396
104- # Load all verb classes
105- classes = loader.load_verb_classes(data_dir / " verbnet.jsonl " )
97+ # Access the already-loaded verb classes
98+ classes = list ( loader.classes.values() )
10699
107100# Find a specific class
108101give_class = next (
@@ -125,13 +118,12 @@ if give_class:
125118
126119``` python
127120from glazing.propbank.loader import PropBankLoader
128- from pathlib import Path
129121
130- data_dir = Path.home() / " .local/share/glazing/converted "
122+ # Loader automatically uses default path and loads data
131123loader = PropBankLoader()
132124
133- # Load framesets
134- framesets = loader.load_framesets(data_dir / " propbank.jsonl " )
125+ # Access the already-loaded framesets
126+ framesets = list ( loader.framesets.values() )
135127
136128# Find rolesets for "give"
137129give_framesets = [fs for fs in framesets if fs.lemma == " give" ]
@@ -149,16 +141,20 @@ for frameset in give_framesets:
149141``` python
150142from glazing.references.extractor import ReferenceExtractor
151143from glazing.references.resolver import ReferenceResolver
152- from pathlib import Path
144+ from glazing.verbnet.loader import VerbNetLoader
145+ from glazing.propbank.loader import PropBankLoader
153146
154- data_dir = Path.home() / " .local/share/glazing/converted"
147+ # Load datasets
148+ vn_loader = VerbNetLoader() # Automatically loads data
149+ pb_loader = PropBankLoader() # Automatically loads data
155150
156- # Extract all references
151+ # Extract references
157152extractor = ReferenceExtractor()
158- references = extractor.extract_from_datasets(data_dir)
153+ extractor.extract_verbnet_references(list (vn_loader.classes.values()))
154+ extractor.extract_propbank_references(list (pb_loader.framesets.values()))
159155
160156# Resolve references for a PropBank roleset
161- resolver = ReferenceResolver(references )
157+ resolver = ReferenceResolver(extractor.mapping_index )
162158related = resolver.resolve(" give.01" , source = " propbank" )
163159
164160print (f " PropBank roleset: give.01 " )
@@ -171,13 +167,10 @@ print(f"WordNet senses: {related.wordnet_senses}")
171167
172168``` python
173169from glazing.wordnet.loader import WordNetLoader
174- from pathlib import Path
175170
176- data_dir = Path.home() / " .local/share/glazing/converted "
171+ # Loader automatically uses default path and loads data
177172loader = WordNetLoader()
178-
179- # Load synsets
180- synsets = loader.load_synsets(data_dir / " wordnet.jsonl" )
173+ synsets = list (loader.synsets.values()) # Already loaded
181174
182175# Find synsets for "dog"
183176dog_synsets = [s for s in synsets if any (
@@ -203,13 +196,12 @@ For memory-efficient processing:
203196
204197``` python
205198from glazing.verbnet.loader import VerbNetLoader
206- from pathlib import Path
207199
208- data_dir = Path.home() / " .local/share/glazing/converted "
209- loader = VerbNetLoader()
200+ # For memory-efficient streaming, enable lazy loading and disable autoload
201+ loader = VerbNetLoader(lazy = True , autoload = False )
210202
211203# Stream verb classes one at a time
212- for verb_class in loader.stream_verb_classes(data_dir / " verbnet.jsonl " ):
204+ for verb_class in loader.iter_verb_classes( ):
213205 # Process each class without loading all into memory
214206 if " run" in [m.name for m in verb_class.members]:
215207 print (f " Found 'run' in class: { verb_class.id} " )
@@ -222,10 +214,11 @@ for verb_class in loader.stream_verb_classes(data_dir / "verbnet.jsonl"):
222214
223215``` python
224216from glazing.verbnet.search import VerbNetSearch
225- from pathlib import Path
217+ from glazing.verbnet.loader import VerbNetLoader
226218
227- data_dir = Path.home() / " .local/share/glazing/converted"
228- search = VerbNetSearch(data_dir / " verbnet.jsonl" )
219+ # Loader automatically loads data
220+ loader = VerbNetLoader()
221+ search = VerbNetSearch(list (loader.classes.values()))
229222
230223# Find all classes with an Agent role
231224agent_classes = []
@@ -241,13 +234,10 @@ print(f"Classes with Agent role: {len(agent_classes)}")
241234``` python
242235import json
243236from glazing.framenet.loader import FrameNetLoader
244- from pathlib import Path
245237
246- data_dir = Path.home() / " .local/share/glazing/converted "
238+ # Loader automatically uses default path and loads data
247239loader = FrameNetLoader()
248-
249- # Load frames
250- frames = loader.load_frames(data_dir / " framenet.jsonl" )
240+ frames = loader.frames # Already loaded
251241
252242# Export as simple JSON
253243simple_frames = []
0 commit comments