- prediction/image/ FastAPI 서버 Docker 환경 구성 - Dockerfile: PyTorch 2.1 + CUDA 12.1 기반 GPU 이미지 - docker-compose.yml: GPU 할당 + 데이터 볼륨 마운트 - requirements.txt: 서버 의존성 목록 - .env.example: 환경변수 템플릿 - DOCKER_USAGE.md: 빌드/실행/API 사용법 문서 - Dockerfile에 .dockerignore 제외 폴더 mkdir -p 추가 - .gitignore: prediction/image 결과물 및 모델 가중치(.pth) 제외 추가 - dbInsert_csv.py, dbInsert_shp.py 삭제 (미사용 DB 로직) - api.py: dbInsert import 및 주석 처리된 DB 호출 코드 제거 - aerialRouter.ts: req.params 타입 오류 수정
82 lines
2.7 KiB
Python
82 lines
2.7 KiB
Python
# Copyright (c) OpenMMLab. All rights reserved.
|
|
import mmcv
|
|
import torch
|
|
from mmcv.parallel import MMDataParallel, MMDistributedDataParallel
|
|
|
|
from mmseg import digit_version
|
|
|
|
dp_factory = {'cuda': MMDataParallel, 'cpu': MMDataParallel}
|
|
|
|
ddp_factory = {'cuda': MMDistributedDataParallel}
|
|
|
|
|
|
def build_dp(model, device='cuda', dim=0, *args, **kwargs):
|
|
"""build DataParallel module by device type.
|
|
|
|
if device is cuda, return a MMDataParallel module; if device is mlu,
|
|
return a MLUDataParallel module.
|
|
|
|
Args:
|
|
model (:class:`nn.Module`): module to be parallelized.
|
|
device (str): device type, cuda, cpu or mlu. Defaults to cuda.
|
|
dim (int): Dimension used to scatter the data. Defaults to 0.
|
|
|
|
Returns:
|
|
:class:`nn.Module`: parallelized module.
|
|
"""
|
|
if device == 'cuda':
|
|
model = model.cuda()
|
|
elif device == 'mlu':
|
|
assert digit_version(mmcv.__version__) >= digit_version('1.5.0'), \
|
|
'Please use MMCV >= 1.5.0 for MLU training!'
|
|
from mmcv.device.mlu import MLUDataParallel
|
|
dp_factory['mlu'] = MLUDataParallel
|
|
model = model.mlu()
|
|
|
|
return dp_factory[device](model, dim=dim, *args, **kwargs)
|
|
|
|
|
|
def build_ddp(model, device='cuda', *args, **kwargs):
|
|
"""Build DistributedDataParallel module by device type.
|
|
|
|
If device is cuda, return a MMDistributedDataParallel module;
|
|
if device is mlu, return a MLUDistributedDataParallel module.
|
|
|
|
Args:
|
|
model (:class:`nn.Module`): module to be parallelized.
|
|
device (str): device type, mlu or cuda.
|
|
|
|
Returns:
|
|
:class:`nn.Module`: parallelized module.
|
|
|
|
References:
|
|
.. [1] https://pytorch.org/docs/stable/generated/torch.nn.parallel.
|
|
DistributedDataParallel.html
|
|
"""
|
|
assert device in ['cuda', 'mlu'], 'Only available for cuda or mlu devices.'
|
|
if device == 'cuda':
|
|
model = model.cuda()
|
|
elif device == 'mlu':
|
|
assert digit_version(mmcv.__version__) >= digit_version('1.5.0'), \
|
|
'Please use MMCV >= 1.5.0 for MLU training!'
|
|
from mmcv.device.mlu import MLUDistributedDataParallel
|
|
ddp_factory['mlu'] = MLUDistributedDataParallel
|
|
model = model.mlu()
|
|
|
|
return ddp_factory[device](model, *args, **kwargs)
|
|
|
|
|
|
def is_mlu_available():
|
|
"""Returns a bool indicating if MLU is currently available."""
|
|
return hasattr(torch, 'is_mlu_available') and torch.is_mlu_available()
|
|
|
|
|
|
def get_device():
|
|
"""Returns an available device, cpu, cuda or mlu."""
|
|
is_device_available = {
|
|
'cuda': torch.cuda.is_available(),
|
|
'mlu': is_mlu_available()
|
|
}
|
|
device_list = [k for k, v in is_device_available.items() if v]
|
|
return device_list[0] if len(device_list) == 1 else 'cpu'
|