API details: Module for defining configuration and downloading data from various sources such as Kaggle, fastai, and GitHub
from nbdev import *
# %nbdev_default_export data.external
# %nbdev_default_export data.external
True

Extend Configuration

class Config[source]

Config()

Set up the config at ~/.fastai unless it already exists.

fname = URLs.PETS.split("/")[-1]
c_key='model'
local_path = URLs.LOCAL_PATH/('model' if c_key=='model' else 'data')/fname

local_path
Path('/Landmark2/pdo/Code/ALDAOps/nlphero/nbs/model/oxford-iiit-pet.tgz')
Config().d.keys()
dict_keys(['archive_path', 'data_path', 'model_path', 'storage_path', 'version'])
Config()[c_key]
Path('/Landmark2/pdo/.nlphero/models')
Config()['data']
Path('/Landmark2/pdo/.nlphero/data')
URLs.path()
Path('/home/ubuntu/.fastai/archive')
os.environ["FASTAI_HOME"] = str(Config().config_path.absolute())
URLs.path()
Path('/home/ubuntu/.fastai/archive')
URLs.path()
Path('/home/ubuntu/.fastai/archive')

Extend URL

class URLs[source]

URLs()

Global constants for dataset and model URLs.

URLs.path()
Path('/Landmark2/pdo/.nlphero/archive')

Kaggle Dataset Utilities

This is a helper class for downloading Kaggle datasets in the required directory structure.

class KAGGLEs[source]

KAGGLEs()

KAGGLEs.path()
Path('/Landmark2/pdo/.nlphero/archive')
URLs.path(URLs.PETS)
Path('/Landmark2/pdo/.nlphero/archive/oxford-iiit-pet.tgz')
URLs.path(URLs.PETS, c_key="data")
Path('/Landmark2/pdo/.nlphero/data/oxford-iiit-pet.tgz')
KAGGLEs.path(KAGGLEs.SPOOKY_AUTHOR_IDENTIFICATION)
Path('/Landmark2/pdo/.nlphero/archive/spooky-author-identification')
KAGGLEs.path(KAGGLEs.SPOOKY)
Path('/Landmark2/pdo/.nlphero/archive/spooky')
KAGGLEs.ktype(KAGGLEs.SPOOKY)
'datasets'
!cat /Landmark2/pdo/.nlphero/config.yml
archive_path: /Landmark2/pdo/.nlphero/archive
data_path: /Landmark2/pdo/.nlphero/data
model_path: /Landmark2/pdo/.nlphero/models
storage_path: /tmp
version: 2

download_kaggle[source]

download_kaggle(url, dest, overwrite=False)

Download `url` to `dest`, skipping the download if the file already exists and `overwrite` is False.

download_data[source]

download_data(url, fname=None, c_key='archive', force_download=False, timeout=4)

Download url to fname.

 
 
 
KAGGLEs.SPOOKY
'kaggle_datasets::abhishek/spooky'
KAGGLEs.SPOOKY.startswith("kaggle")
True

untar_data[source]

untar_data(url, fname=None, dest=None, c_key='data', force_download=False, extract_func=file_extract, timeout=4)

Download `url` to `fname` if `dest` doesn't exist, and un-tgz or unzip it into the folder `dest`.

 
is_kaggle = KAGGLEs.SPOOKY.startswith("kaggle")
T = [URLs, KAGGLEs][is_kaggle]
T
__main__.KAGGLEs
URLs
__main__.URLs
T.path()
Path('/Landmark2/pdo/.nlphero/archive')
c_key='data'
# url = KAGGLEs.SPOOKY
url = URLs.PETS
is_kaggle =url.startswith("kaggle")
T = [URLs, KAGGLEs][is_kaggle]
dest=None
fname = None
default_dest = T.path(url, c_key=c_key).with_suffix('')
dest = default_dest if dest is None else Path(dest)/default_dest.name
fname = Path(fname or T.path(url))
default_dest
Path('/Landmark2/pdo/.nlphero/data/oxford-iiit-pet')
dest.parent
Path('/Landmark2/pdo/.nlphero/data')
fname.suffix
'.tgz'

list_checked_data[source]

list_checked_data()

 
# pd.DataFrame([path.name for path in KAGGLEs.path(c_key='data').ls()])
print("Check")
Check

Bing Image Dataset Utilities

search_images_bing[source]

search_images_bing(key, term, count=150, min_sz=128)

('/Landmark2/pdo/.nlphero/data', '/Landmark2/pdo/.nlphero/data')

construct_image_dataset[source]

construct_image_dataset(clstypes, dest, key=None, loc=None, count=150)

list_ds[source]

list_ds(loc=None)

# loc =os.path.join(os.getenv("NLPHERO_HOME"), "data")
# if Path(loc).exists(): print(list_ds(loc))
clstypes = "Sarah Shahi", "Mercedes Masohn", "Jeffrey Dean Morgan", "Javier Bardem", "Benicio Del Toro", "Brad Pitt"
dest = "DoppelgangerMixed"
count=150
 
 
 

get_ds[source]

get_ds(name, loc=None)