|
3D-GPT: Procedural 3D Modeling with Large Language Models
Chunyi Sun, Junlin Han, Weijian Deng, Xinlong Wang, Zishan Qin, Stephen Gould.
To appear in International Conference on 3D Vision (3DV), 2025.
@inproceedings{Sun:3DV2025,
  author    = {Sun, Chunyi and
               Han, Junlin and
               Deng, Weijian and
               Wang, Xinlong and
               Qin, Zishan and
               Gould, Stephen},
  title     = {{3D-GPT}: Procedural {3D} Modeling with Large Language Models},
  booktitle = {3DV},
  year      = {2025},
}
[ paper coming soon |
preprint |
project |
bib ]
|
|
Temporally Grounding Instructional Diagrams in Unconstrained Videos
Jiahao Zhang, Frederic Zhang, Cristian Rodriguez, Yizhak Ben-Shabat, Anoop Cherian, Stephen Gould.
To appear in Winter Conference on Applications of Computer Vision (WACV), 2025.
@inproceedings{Zhang:WACV2025,
  author    = {Zhang, Jiahao and
               Zhang, Frederic and
               Rodriguez, Cristian and
               Ben-Shabat, Yizhak and
               Cherian, Anoop and
               Gould, Stephen},
  title     = {Temporally Grounding Instructional Diagrams in Unconstrained Videos},
  booktitle = {WACV},
  year      = {2025},
}
[ paper coming soon |
bib ]
|
|
Guiding Neural Collapse: Optimising Towards the Nearest Simplex Equiangular Tight Frame
Evan Markou, Thalaiyasingam Ajanthan and Stephen Gould.
To appear in Advances in Neural Information Processing Systems (NeurIPS), 2024.
@inproceedings{Markou:NIPS2024,
  author    = {Markou, Evan and
               Ajanthan, Thalaiyasingam and
               Gould, Stephen},
  title     = {Guiding Neural Collapse: Optimising Towards the Nearest Simplex Equiangular Tight Frame},
  booktitle = {NeurIPS},
  year      = {2024},
}
[ paper coming soon |
preprint |
bib ]
|
|
Neural Experts: Mixture of Experts for Implicit Neural Representations
Yizhak Ben-Shabat, Chamin Hewa Koneputugodage, Sameera Ramasinghe and Stephen Gould.
To appear in Advances in Neural Information Processing Systems (NeurIPS), 2024.
@inproceedings{BenShabat:NIPS2024,
  author    = {Ben-Shabat, Yizhak and
               Koneputugodage, Chamin Hewa and
               Ramasinghe, Sameera and
               Gould, Stephen},
  title     = {Neural Experts: Mixture of Experts for Implicit Neural Representations},
  booktitle = {NeurIPS},
  year      = {2024},
}
[ paper coming soon |
bib ]
|
|
Unsupervised Dense Prediction using Differentiable Normalized Cuts
Yanbin Liu and Stephen Gould.
In Proceedings of the European Conference on Computer Vision (ECCV), 2024.
@inproceedings{Liu:ECCV2024,
  author    = {Liu, Yanbin and
               Gould, Stephen},
  title     = {Unsupervised Dense Prediction using Differentiable Normalized Cuts},
  booktitle = {ECCV},
  year      = {2024},
}
[ paper |
video |
bib ]
|
|
The First to Know: How Token Distributions Reveal Hidden Knowledge in Large Vision-Language Models?
Qinyu Zhao, Ming Xu, Kartik Gupta, Akshay Asthana, Liang Zheng and Stephen Gould.
In Proceedings of the European Conference on Computer Vision (ECCV), 2024.
@inproceedings{Zhao:ECCV2024,
  author    = {Zhao, Qinyu and
               Xu, Ming and
               Gupta, Kartik and
               Asthana, Akshay and
               Zheng, Liang and
               Gould, Stephen},
  title     = {The First to Know: How Token Distributions Reveal Hidden Knowledge in Large Vision-Language Models?},
  booktitle = {ECCV},
  year      = {2024},
}
[ paper coming soon |
preprint |
project |
bib ]
|
|
An Empirical Study into What Matters for Calibrating Vision-Language Models
Weijie Tu, Weijian Deng, Dylan Campbell, Stephen Gould and Tom Gedeon.
In the International Conference on Machine Learning (ICML), 2024.
@inproceedings{Tu:ICML2024,
  author    = {Tu, Weijie and
               Deng, Weijian and
               Campbell, Dylan and
               Gould, Stephen and
               Gedeon, Tom},
  title     = {An Empirical Study into What Matters for Calibrating Vision-Language Models},
  booktitle = {ICML},
  year      = {2024},
}
[ paper |
bib ]
|
|
Temporally Consistent Unbalanced Optimal Transport for Unsupervised Action Segmentation
Ming Xu and Stephen Gould.
In IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2024.
@inproceedings{Xu:CVPR2024,
  author    = {Xu, Ming and
               Gould, Stephen},
  title     = {Temporally Consistent Unbalanced Optimal Transport for Unsupervised Action Segmentation},
  booktitle = {CVPR},
  year      = {2024},
}
[ paper |
preprint |
code |
bib ]
|
|
Small Steps and Level Sets: Fitting Neural Surface Models with Point Guidance
Chamin Hewa Koneputugodage, Yizhak Ben-Shabat, Dylan Campbell and Stephen Gould.
In IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2024.
@inproceedings{Koneputugodage:CVPR2024,
  author    = {Koneputugodage, Chamin Hewa and
               Ben-Shabat, Yizhak and
               Campbell, Dylan and
               Gould, Stephen},
  title     = {Small Steps and Level Sets: Fitting Neural Surface Models with Point Guidance},
  booktitle = {CVPR},
  year      = {2024},
}
[ paper |
talk |
code |
bib ]
|
|
Differentiable Neural Surface Refinement for Transparent Objects
Weijian Deng, Dylan Campbell, Chunyi Sun, Shubham Kanitkar, Matthew E. Shaffer and Stephen Gould.
In IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2024.
@inproceedings{Deng:CVPR2024,
  author    = {Deng, Weijian and
               Campbell, Dylan and
               Sun, Chunyi and
               Kanitkar, Shubham and
               Shaffer, Matthew E. and
               Gould, Stephen},
  title     = {Differentiable Neural Surface Refinement for Transparent Objects},
  booktitle = {CVPR},
  year      = {2024},
}
[ paper |
talk |
project |
bib ]
|
|
Selective View Pipelining: An Efficient Approach for Multi-view Understanding
Yunzhong Hou, Stephen Gould and Liang Zheng.
In IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2024.
@inproceedings{Hou:CVPR2024,
  author    = {Hou, Yunzhong and
               Gould, Stephen and
               Zheng, Liang},
  title     = {Selective View Pipelining: An Efficient Approach for Multi-view Understanding},
  booktitle = {CVPR},
  year      = {2024},
}
[ paper |
bib ]
|
|
3DInAction: Understanding Human Actions in 3D Point Clouds
Yizhak Ben-Shabat, Oren Shrout and Stephen Gould.
In IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2024.
@inproceedings{BenShabat:CVPR2024,
  author    = {Ben-Shabat, Yizhak and
               Shrout, Oren and
               Gould, Stephen},
  title     = {{3DInAction}: Understanding Human Actions in {3D} Point Clouds},
  booktitle = {CVPR},
  year      = {2024},
}
[ paper |
preprint |
talk |
code |
bib ]
|
|
Neuro-symbolic Learning of Lifted Action Models from Visual Traces
Kai (Oliver) Xi, Stephen Gould and Sylvie Thiebaux.
In International Conference on Automated Planning and Scheduling (ICAPS), 2024.
@inproceedings{Xi:ICAPS2024,
  author    = {Xi, Kai and
               Gould, Stephen and
               Thiebaux, Sylvie},
  title     = {Neuro-symbolic Learning of Lifted Action Models from Visual Traces},
  booktitle = {ICAPS},
  year      = {2024},
}
[ paper |
bib ]
|
|
Candidate Set Re-ranking for Composed Image Retrieval with Dual Multi-modal Encoder
Zheyuan Liu, Weixuan Sun, Damien Teney and Stephen Gould.
In Transactions on Machine Learning Research (TMLR), 2024.
@article{Liu:TMLR2024,
  author  = {Liu, Zheyuan and
             Sun, Weixuan and
             Teney, Damien and
             Gould, Stephen},
  title   = {Candidate Set Re-ranking for Composed Image Retrieval with Dual Multi-modal Encoder},
  journal = {TMLR},
  year    = {2024},
}
[ paper |
preprint |
project |
bib ]
|
|
Towards Optimal Feature-Shaping Methods for Out-of-Distribution Detection
Qinyu Zhao, Ming Xu, Kartik Gupta, Akshay Asthana, Liang Zheng and Stephen Gould.
In International Conference on Learning Representations (ICLR), 2024.
@inproceedings{Zhao:ICLR2024,
  author    = {Zhao, Qinyu and
               Xu, Ming and
               Gupta, Kartik and
               Asthana, Akshay and
               Zheng, Liang and
               Gould, Stephen},
  title     = {Towards Optimal Feature-Shaping Methods for Out-of-Distribution Detection},
  booktitle = {ICLR},
  year      = {2024},
}
[ paper |
bib ]
|
|
View-coherent Correlation Consistency for Semi-supervised Semantic Segmentation
Yunzhong Hou, Stephen Gould and Liang Zheng.
In Pattern Recognition, 2024.
@article{Hou:PR2024,
  author  = {Hou, Yunzhong and
             Gould, Stephen and
             Zheng, Liang},
  title   = {View-coherent Correlation Consistency for Semi-supervised Semantic Segmentation},
  journal = {Pattern Recognition},
  year    = {2024},
}
[ paper |
bib ]
|
|
Ray Deformation Networks for Novel View Synthesis of Refractive Objects
Weijian Deng, Dylan Campbell, Chunyi Sun, Shubham Kanitkar, Matthew Shaffer and Stephen Gould.
In IEEE Winter Conference on Applications of Computer Vision (WACV), 2024.
@inproceedings{Deng:WACV24,
  author    = {Deng, Weijian and
               Campbell, Dylan and
               Sun, Chunyi and
               Kanitkar, Shubham and
               Shaffer, Matthew and
               Gould, Stephen},
  title     = {Ray Deformation Networks for Novel View Synthesis of Refractive Objects},
  booktitle = {WACV},
  year      = {2024},
}
[ paper |
project |
bib ]
|
|
IKEA Ego 3D dataset: Understanding furniture assembly actions from ego view 3D Point Clouds
Yizhak Ben-Shabat, Oren Shrout, Jonathan Paul, Eviatar Segev and Stephen Gould.
In IEEE Winter Conference on Applications of Computer Vision (WACV), 2024.
@inproceedings{BenShabat:WACV24,
  author    = {Ben-Shabat, Yizhak and
               Shrout, Oren and
               Paul, Jonathan and
               Segev, Eviatar and
               Gould, Stephen},
  title     = {{IKEA} {Ego} {3D} dataset: Understanding furniture assembly actions from ego view {3D} Point Clouds},
  booktitle = {WACV},
  year      = {2024},
}
[ paper |
bib ]
|
|
LipAT: Beyond Style Transfer for Controllable Neural Simulation of Lipstick using Cosmetic Attributes
Amila Silva, Olga Moskvyak, Alexander Long, Ravi Garg, Stephen Gould, Gil Avraham and Anton van den Hengel.
In IEEE Winter Conference on Applications of Computer Vision (WACV), 2024.
@inproceedings{Silva:WACV24,
  author    = {Silva, Amila and
               Moskvyak, Olga and
               Long, Alexander and
               Garg, Ravi and
               Gould, Stephen and
               Avraham, Gil and
               van den Hengel, Anton},
  title     = {{LipAT}: Beyond Style Transfer for Controllable Neural Simulation of Lipstick using Cosmetic Attributes},
  booktitle = {WACV},
  year      = {2024},
}
[ paper |
bib ]
|
|
NeRFEditor: Differentiable Style Decomposition for 3D Scene Editing
Chunyi Sun, Yanbin Liu, Junlin Han and Stephen Gould.
In IEEE Winter Conference on Applications of Computer Vision (WACV), 2024.
@inproceedings{Sun:WACV24,
  author    = {Sun, Chunyi and
               Liu, Yanbin and
               Han, Junlin and
               Gould, Stephen},
  title     = {{NeRFEditor}: Differentiable Style Decomposition for {3D} Scene Editing},
  booktitle = {WACV},
  year      = {2024},
}
[ paper |
bib ]
|
|
Bi-directional Training for Composed Image Retrieval via Text Prompt Learning
Zheyuan Liu, Weixuan Sun, Yicong Hong, Damien Teney and Stephen Gould.
In IEEE Winter Conference on Applications of Computer Vision (WACV), 2024.
@inproceedings{Liu:WACV24,
  author    = {Liu, Zheyuan and
               Sun, Weixuan and
               Hong, Yicong and
               Teney, Damien and
               Gould, Stephen},
  title     = {Bi-directional Training for Composed Image Retrieval via Text Prompt Learning},
  booktitle = {WACV},
  year      = {2024},
}
[ paper |
bib ]
|
|
Revisiting Implicit Differentiation for Learning Problems in Optimal Control
Ming Xu, Timothy Molloy and Stephen Gould.
In Advances in Neural Information Processing Systems (NeurIPS), 2023.
@inproceedings{Xu:NeurIPS23,
  author    = {Xu, Ming and
               Molloy, Timothy L. and
               Gould, Stephen},
  title     = {Revisiting Implicit Differentiation for Learning Problems in Optimal Control},
  booktitle = {NeurIPS},
  year      = {2023},
}
[ paper |
preprint |
code |
bib ]
|
|
Exploring Predictive Visual Context for Detecting Human–Object Interactions
Frederic Zhang, Yuhui Yuan, Dylan Campbell, Zhuoyao Zhong and Stephen Gould.
In IEEE International Conference on Computer Vision (ICCV), 2023.
@inproceedings{Zhang:ICCV23,
  author    = {Zhang, Frederic and
               Yuan, Yuhui and
               Campbell, Dylan and
               Zhong, Zhuoyao and
               Gould, Stephen},
  title     = {Exploring Predictive Visual Context for Detecting Human--Object Interactions},
  booktitle = {ICCV},
  year      = {2023},
}
[ paper |
preprint |
code |
bib ]
|
|
Semi-Supervised Semantic Segmentation under Label Noise via Diverse Learning Groups
Peixia Li, Pulak Purkait, Thalaiyasingam Ajanthan, Majid Abdolshah, Ravi Garg, Hisham Husain, Chenchen Xu, Stephen Gould, Wanli Ouyang and Anton van den Hengel.
In IEEE International Conference on Computer Vision (ICCV), 2023.
@inproceedings{Li:ICCV23,
  author    = {Li, Peixia and
               Purkait, Pulak and
               Ajanthan, Thalaiyasingam and
               Abdolshah, Majid and
               Garg, Ravi and
               Husain, Hisham and
               Xu, Chenchen and
               Gould, Stephen and
               Ouyang, Wanli and
               van den Hengel, Anton},
  title     = {Semi-Supervised Semantic Segmentation under Label Noise via Diverse Learning Groups},
  booktitle = {ICCV},
  year      = {2023},
}
[ paper |
bib ]
|
|
Scaling Data Generation in Vision-and-Language Navigation
Zun Wang, Jialu Li, Yicong Hong, Yi Wang, Qi Wu, Mohit Bansal, Stephen Gould, Hao Tan and Yu Qiao.
In IEEE International Conference on Computer Vision (ICCV), 2023.
@inproceedings{Wang:ICCV23,
  author    = {Wang, Zun and
               Li, Jialu and
               Hong, Yicong and
               Wang, Yi and
               Wu, Qi and
               Bansal, Mohit and
               Gould, Stephen and
               Tan, Hao and
               Qiao, Yu},
  title     = {Scaling Data Generation in Vision-and-Language Navigation},
  booktitle = {ICCV},
  year      = {2023},
}
[ paper |
code |
bib ]
|
|
Learning Navigational Visual Representations with Semantic Map Supervision
Yicong Hong, Yang Zhou, Ruiyi Zhang, Franck Dernoncourt, Trung Bui, Stephen Gould and Hao Tan.
In IEEE International Conference on Computer Vision (ICCV), 2023.
@inproceedings{Hong:ICCV23,
  author    = {Hong, Yicong and
               Zhou, Yang and
               Zhang, Ruiyi and
               Dernoncourt, Franck and
               Bui, Trung and
               Gould, Stephen and
               Tan, Hao},
  title     = {Learning Navigational Visual Representations with Semantic Map Supervision},
  booktitle = {ICCV},
  year      = {2023},
}
[ paper |
bib ]
|
|
Towards Understanding Gradient Approximation in Equality Constrained Deep Declarative Networks
Stephen Gould, Ming Xu, Zhiwei Xu, Yanbin Liu.
In the ICML Workshop on Differentiable Almost Everything, 2023.
@inproceedings{Gould:ICML23w,
  author    = {Gould, Stephen and
               Xu, Ming and
               Xu, Zhiwei and
               Liu, Yanbin},
  title     = {Towards Understanding Gradient Approximation in Equality Constrained Deep Declarative Networks},
  booktitle = {ICML Workshop on Differentiable Almost Everything: Differentiable Relaxations, Algorithms, Operators, and Simulators},
  year      = {2023},
}
[ preprint |
code |
bib ]
|
|
PMaF: Deep Declarative Layers for Principal Matrix Features
Zhiwei Xu, Hao Wang, Yanbin Liu and Stephen Gould.
In the ICML Workshop on Differentiable Almost Everything, 2023.
@inproceedings{Xu:ICML23w,
  author    = {Xu, Zhiwei and
               Wang, Hao and
               Liu, Yanbin and
               Gould, Stephen},
  title     = {{PMaF}: Deep Declarative Layers for Principal Matrix Features},
  booktitle = {ICML Workshop on Differentiable Almost Everything: Differentiable Relaxations, Algorithms, Operators, and Simulators},
  year      = {2023},
}
[ preprint |
code |
bib ]
|
|
Confidence and Dispersity Speak: Characterizing Prediction Matrix for Unsupervised Accuracy Estimation
Weijian Deng, Yumin Suh, Stephen Gould and Liang Zheng.
In the International Conference on Machine Learning (ICML), 2023.
@inproceedings{Deng:ICML23,
  author    = {Deng, Weijian and
               Suh, Yumin and
               Gould, Stephen and
               Zheng, Liang},
  title     = {Confidence and Dispersity Speak: Characterizing Prediction Matrix for Unsupervised Accuracy Estimation},
  booktitle = {ICML},
  year      = {2023},
}
[ paper coming soon |
code coming soon |
bib ]
|
|
Octree Guided Unoriented Surface Reconstruction
Chamin Hewa Koneputugodage, Yizhak Ben-Shabat and Stephen Gould.
In the IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2023.
@inproceedings{Koneputugodage:CVPR23,
  author    = {Koneputugodage, Chamin Hewa and
               Ben-Shabat, Yizhak and
               Gould, Stephen},
  title     = {Octree Guided Unoriented Surface Reconstruction},
  booktitle = {CVPR},
  year      = {2023},
}
[ paper |
project |
code |
bib ]
|
|
Aligning Step-by-Step Instructional Diagrams to Video Demonstrations
Jiahao Zhang, Anoop Cherian, Yanbin Liu, Yizhak Ben-Shabat, Cristian Rodriguez and Stephen Gould.
In the IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2023.
@inproceedings{Zhang:CVPR23,
  author    = {Zhang, Jiahao and
               Cherian, Anoop and
               Liu, Yanbin and
               Ben-Shabat, Yizhak and
               Rodriguez, Cristian and
               Gould, Stephen},
  title     = {Aligning Step-by-Step Instructional Diagrams to Video Demonstrations},
  booktitle = {CVPR},
  year      = {2023},
}
[ paper |
preprint |
code |
dataset |
project |
bib ]
|
|
High-Fidelity Guided Image Synthesis with Latent Diffusion Models
Jaskirat Singh, Liang Zheng and Stephen Gould.
In the IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2023.
@inproceedings{Singh:CVPR23,
  author    = {Singh, Jaskirat and
               Zheng, Liang and
               Gould, Stephen},
  title     = {High-Fidelity Guided Image Synthesis with Latent Diffusion Models},
  booktitle = {CVPR},
  year      = {2023},
}
[ paper |
preprint |
project |
bib ]
|
|
Deep Declarative Dynamic Time Warping for End-to-end Learning of Alignment Paths
Ming Xu, Sourav Garg, Michael Milford and Stephen Gould.
In International Conference on Learning Representations (ICLR), 2023.
@inproceedings{Xu:ICLR23,
  author    = {Xu, Ming and
               Garg, Sourav and
               Milford, Michael and
               Gould, Stephen},
  title     = {Deep Declarative Dynamic Time Warping for End-to-end Learning of Alignment Paths},
  booktitle = {ICLR},
  year      = {2023},
}
[ paper |
preprint |
code |
bib ]
|
|
On the Strong Correlation Between Model Invariance and Generalization
Weijian Deng, Stephen Gould and Liang Zheng.
In Advances in Neural Information Processing Systems (NeurIPS), 2022.
@inproceedings{Deng:NeurIPS22,
  author    = {Deng, Weijian and
               Gould, Stephen and
               Zheng, Liang},
  title     = {On the Strong Correlation Between Model Invariance and Generalization},
  booktitle = {NeurIPS},
  year      = {2022},
}
[ paper |
bib ]
|
|
GoferBot: A Visual Guided Human-Robot Collaborative Assembly System
Zheyu Zhuang, Yizhak Ben-Shabat, Jiahao Zhang, Stephen Gould and Robert Mahony.
In International Conference on Intelligent Robots and Systems (IROS), 2022.
@inproceedings{Zhuang:IROS2022,
  author    = {Zhuang, Zheyu and
               Ben-Shabat, Yizhak and
               Zhang, Jiahao and
               Gould, Stephen and
               Mahony, Robert},
  title     = {{GoferBot}: A Visual Guided Human-Robot Collaborative Assembly System},
  booktitle = {IROS},
  year      = {2022},
}
[ paper |
video |
bib ]
|
|
Fine-grained Classification via Categorical Memory Networks
Weijian Deng, Joshua Marsh, Stephen Gould and Liang Zheng.
In the IEEE Transactions on Image Processing (TIP), 2022.
@article{Deng:TIP2022,
  author  = {Deng, Weijian and
             Marsh, Joshua and
             Gould, Stephen and
             Zheng, Liang},
  title   = {Fine-grained Classification via Categorical Memory Networks},
  journal = {TIP},
  year    = {2022},
}
[ paper |
preprint |
bib ]
|
|
Bridging the Gap Between Learning in Discrete and Continuous Environments for Vision-and-Language Navigation
Yicong Hong, Zun Wang, Qi Wu and Stephen Gould.
In the IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2022.
@inproceedings{Hong:CVPR2022,
  author    = {Hong, Yicong and
               Wang, Zun and
               Wu, Qi and
               Gould, Stephen},
  title     = {Bridging the Gap Between Learning in Discrete and Continuous Environments for Vision-and-Language Navigation},
  booktitle = {CVPR},
  year      = {2022},
}
[ paper |
preprint |
bib ]
|
|
Efficient Two-Stage Detection of Human-Object Interactions with a Novel Unary-Pairwise Transformer
Zhen Zhang, Dylan Campbell and Stephen Gould.
In the IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2022.
@inproceedings{Zhang:CVPR2022,
  author    = {Zhang, Zhen and
               Campbell, Dylan and
               Gould, Stephen},
  title     = {Efficient Two-Stage Detection of Human-Object Interactions with a Novel Unary-Pairwise Transformer},
  booktitle = {CVPR},
  year      = {2022},
}
[ paper |
preprint |
code |
bib ]
|
|
DiGS: Divergence Guided Shape Implicit Neural Representation for Unoriented Point Clouds
Yizhak Ben-Shabat, Chamin Hewa Koneputugodage and Stephen Gould.
In the IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2022.
@inproceedings{BenShabat:CVPR2022,
  author    = {Ben-Shabat, Yizhak and
               Koneputugodage, Chamin Hewa and
               Gould, Stephen},
  title     = {{DiGS}: Divergence Guided Shape Implicit Neural Representation for Unoriented Point Clouds},
  booktitle = {CVPR},
  year      = {2022},
}
[ paper |
preprint |
project |
code |
bib ]
|
|
Exploiting Problem Structure in Deep Declarative Networks: Two Case Studies
Stephen Gould, Dylan Campbell, Yizhak Ben-Shabat, Chamin Hewa Koneputugodage and Zhiwei Xu.
In the First AAAI Workshop on Optimal Transport and Structured Data Modeling (OT-SDM), 2022.
@inproceedings{Gould:OTSDM2022,
  author    = {Gould, Stephen and
               Campbell, Dylan and
               Ben-Shabat, Yizhak and
               Koneputugodage, Chamin Hewa and
               Xu, Zhiwei},
  title     = {Exploiting Problem Structure in Deep Declarative Networks: Two Case Studies},
  booktitle = {First AAAI Workshop on Optimal Transport and Structured Data Modeling ({OT-SDM})},
  year      = {2022},
}
[ paper |
slides |
preprint |
code (rvp) |
code (ot) |
video |
bib ]
|
|
Rethinking Conditional GAN Training: An Approach Using Geometrically Structured Latent Manifolds
Sameera Ramasinghe, Moshiur R. Farazi, Salman Khan, Nick Barnes and Stephen Gould.
In Advances in Neural Information Processing Systems (NeurIPS), 2021.
@inproceedings{Ramasinghe:NeurIPS2021,
  author    = {Ramasinghe, Sameera and
               Farazi, Moshiur R. and
               Khan, Salman and
               Barnes, Nick and
               Gould, Stephen},
  title     = {Rethinking Conditional {GAN} Training: An Approach Using Geometrically Structured Latent Manifolds},
  booktitle = {NeurIPS},
  year      = {2021},
}
[ paper |
preprint |
code |
bib ]
|
|
A Regularized Wasserstein Framework for Graph Kernels
Asiri Wijesinghe, Qing Wang and Stephen Gould.
In IEEE International Conference on Data Mining (ICDM), 2021.
@inproceedings{Wijesinghe:ICDM2021,
  author    = {Wijesinghe, Asiri and
               Wang, Qing and
               Gould, Stephen},
  title     = {A Regularized {Wasserstein} Framework for Graph Kernels},
  booktitle = {ICDM},
  year      = {2021},
}
[ paper |
preprint |
bib ]
|
|
Spatially Conditioned Graphs for Detecting Human-Object Interactions
Frederic Z. Zhang, Dylan Campbell and Stephen Gould.
In IEEE International Conference on Computer Vision (ICCV), 2021.
@inproceedings{Zhang:ICCV2021,
  author    = {Zhang, Frederic Zhen and
               Campbell, Dylan and
               Gould, Stephen},
  title     = {Spatially Conditioned Graphs for Detecting Human-Object Interactions},
  booktitle = {ICCV},
  year      = {2021},
}
[ paper |
preprint |
video |
code |
bib ]
|
|
Image Retrieval on Real-life Images with Pre-trained Vision-and-Language Models
Zheyuan Liu, Cristian Rodriguez, Damien Teney and Stephen Gould.
In IEEE International Conference on Computer Vision (ICCV), 2021.
@inproceedings{Liu:ICCV2021,
  author    = {Liu, Zheyuan and
               Rodriguez, Cristian and
               Teney, Damien and
               Gould, Stephen},
  title     = {Image Retrieval on Real-life Images with Pre-trained Vision-and-Language Models},
  booktitle = {ICCV},
  year      = {2021},
}
[ paper |
data |
bib ]
|
|
Contextually Plausible and Diverse 3D Human Motion Prediction
Sadegh Aliakbarian, Fatemeh Saleh, Lars Petersson, Stephen Gould and Mathieu Salzmann.
In IEEE International Conference on Computer Vision (ICCV), 2021.
@inproceedings{Aliakbarian:ICCV2021,
  author    = {Aliakbarian, Sadegh and
               Saleh, Fatemeh and
               Petersson, Lars and
               Gould, Stephen and
               Salzmann, Mathieu},
  title     = {Contextually Plausible and Diverse {3D} Human Motion Prediction},
  booktitle = {ICCV},
  year      = {2021},
}
[ paper |
bib ]
|
|
What Does Rotation Prediction Tell Us about Classifier Accuracy under Varying Testing Environments?
Weijian Deng, Stephen Gould and Liang Zheng.
In International Conference on Machine Learning (ICML), 2021.
@inproceedings{Deng:ICML2021,
  author    = {Deng, Weijian and
               Gould, Stephen and
               Zheng, Liang},
  title     = {What Does Rotation Prediction Tell Us about Classifier Accuracy under Varying Testing Environments?},
  booktitle = {ICML},
  year      = {2021},
}
[ paper coming soon |
preprint |
code |
bib ]
|
|
A Recurrent Vision-and-Language BERT for Navigation
Yicong Hong, Qi Wu, Yuankai Qi, Cristian Rodriguez and Stephen Gould.
In IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2021.
@inproceedings{Hong:CVPR2021,
  author    = {Hong, Yicong and
               Wu, Qi and
               Qi, Yuankai and
               Rodriguez, Cristian and
               Gould, Stephen},
  title     = {A Recurrent Vision-and-Language {BERT} for Navigation},
  booktitle = {CVPR},
  year      = {2021},
}
[ paper |
preprint |
code |
bib ]
|
|
Probabilistic Tracklet Scoring and Inpainting for Multiple Object Tracking
Fatemeh Saleh, Sadegh Aliakbarian, Hamid Rezatofighi, Mathieu Salzmann and Stephen Gould.
In IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2021.
@inproceedings{Saleh:CVPR2021,
  author    = {Saleh, Fatemeh and
               Aliakbarian, Sadegh and
               Rezatofighi, Hamid and
               Salzmann, Mathieu and
               Gould, Stephen},
  title     = {Probabilistic Tracklet Scoring and Inpainting for Multiple Object Tracking},
  booktitle = {CVPR},
  year      = {2021},
}
[ paper |
preprint |
code |
bib ]
|
|
Deep Declarative Networks
Stephen Gould, Richard Hartley and Dylan Campbell.
In IEEE Transactions on Pattern Analysis and Machine Intelligence (PAMI), 2021.
@article{Gould:PAMI2021,
  author  = {Gould, Stephen and
             Hartley, Richard and
             Campbell, Dylan},
  title   = {Deep Declarative Networks},
  journal = {PAMI},
  year    = {2021},
  doi     = {10.1109/TPAMI.2021.3059462},
}
[ paper |
preprint |
code & resources |
bib ]
|
|
Conditional Generative Modeling via Learning the Latent Space
Sameera Ramasinghe, Kanchana Nisal Ranasinghe, Salman Khan, Nick Barnes and Stephen Gould.
In International Conference on Learning Representations (ICLR), 2021.
@inproceedings{Ramasinghe:ICLR2021,
  author    = {Ramasinghe, Sameera and
               Ranasinghe, Kanchana Nisal and
               Khan, Salman and
               Barnes, Nick and
               Gould, Stephen},
  title     = {Conditional Generative Modeling via Learning the Latent Space},
  booktitle = {ICLR},
  year      = {2021},
}
[ paper |
bib ]
|
|
DORi: Discovering Objects Relationship for Temporal Moment Localization of a Natural-Language Query in Video
Cristian Rodriguez, Edison Marrese-Taylor, Basura Fernando, Hongdong Li and Stephen Gould.
In IEEE Winter Conference on Applications of Computer Vision (WACV), 2021.
@inproceedings{Rodriguez:WACV2021,
  author    = {Rodriguez, Cristian and
               Marrese-Taylor, Edison and
               Fernando, Basura and
               Li, Hongdong and
               Gould, Stephen},
  title     = {{DORi}: Discovering Objects Relationship for Temporal Moment Localization of a Natural-Language Query in Video},
  booktitle = {WACV},
  year      = {2021},
}
[ paper |
bib ]
|
|
The IKEA ASM Dataset: Understanding People Assembling Furniture through Actions, Objects and Pose
Yizhak Ben-Shabat, Xin Yu, Fatemeh Saleh, Dylan Campbell, Cristian Rodriguez, Hongdong Li and Stephen Gould.
In IEEE Winter Conference on Applications of Computer Vision (WACV), 2021.
@inproceedings{BenShabat:WACV2021,
  author    = {Ben-Shabat, Yizhak and
               Yu, Xin and
               Saleh, Fatemeh and
               Campbell, Dylan and
               Rodriguez, Cristian and
               Li, Hongdong and
               Gould, Stephen},
  title     = {The {IKEA} {ASM} Dataset: Understanding People Assembling Furniture through Actions, Objects and Pose},
  booktitle = {WACV},
  year      = {2021},
}
[ paper |
website |
code |
bib ]
|
|
Semantics for Robotic Mapping, Perception and Interaction: A Survey
Sourav Garg, Niko Sunderhauf, Feras Dayoub, Douglas Morrison, Akansel Cosgun, Gustavo Carneiro, Qi Wu, Tat-Jun Chin, Ian Reid, Stephen Gould, Peter Corke and Michael Milford.
In Foundations and Trends in Robotics, 2020.
@article{Garg:Survey2020,
  author  = {Garg, Sourav and
             Sunderhauf, Niko and
             Dayoub, Feras and
             Morrison, Douglas and
             Cosgun, Akansel and
             Carneiro, Gustavo and
             Wu, Qi and
             Chin, Tat-Jun and
             Reid, Ian and
             Gould, Stephen and
             Corke, Peter and
             Milford, Michael},
  title   = {Semantics for Robotic Mapping, Perception and Interaction: A Survey},
  journal = {Foundations and Trends® in Robotics},
  year    = {2020},
  volume  = {8},
  number  = {1--2},
  pages   = {1--224},
}
[ paper |
preprint |
bib ]
|
|
Language and Visual Entity Relationship Graph for Agent Navigation
Yicong Hong, Cristian Rodriguez, Yuankai Qi, Qi Wu and Stephen Gould.
In Advances in Neural Information Processing Systems (NeurIPS), 2020.
@inproceedings{Hong:NeurIPS2020,
  author    = {Hong, Yicong and
               Rodriguez, Cristian and
               Qi, Yuankai and
               Wu, Qi and
               Gould, Stephen},
  title     = {Language and Visual Entity Relationship Graph for Agent Navigation},
  booktitle = {NeurIPS},
  year      = {2020},
}
[ paper |
code |
bib ]
|
|
Joint Unsupervised Learning of Optical Flow and Egomotion with Bi-Level Optimization
Shihao Jiang, Dylan Campbell, Miaomiao Liu, Stephen Gould and Richard Hartley.
In International Conference on 3D Vision (3DV), 2020.
@inproceedings{Jiang:3DV2020,
  author    = {Jiang, Shihao and
               Campbell, Dylan and
               Liu, Miaomiao and
               Gould, Stephen and
               Hartley, Richard},
  title     = {Joint Unsupervised Learning of Optical Flow and Egomotion with Bi-Level Optimization},
  booktitle = {3DV},
  year      = {2020},
}
[ paper |
preprint |
bib ]
|
|
Sub-Instruction Aware Vision-and-Language Navigation
Yicong Hong, Cristian Rodriguez, Qi Wu and Stephen Gould.
In Conference on Empirical Methods in Natural Language Processing (EMNLP), 2020.
@inproceedings{Hong:EMNLP2020,
  author    = {Hong, Yicong and
               Rodriguez, Cristian and
               Wu, Qi and
               Gould, Stephen},
  title     = {Sub-Instruction Aware Vision-and-Language Navigation},
  booktitle = {EMNLP},
  year      = {2020},
}
[ paper |
preprint |
code |
bib ]
|
|
DeepFit: 3D Surface Fitting by Neural Network Weighted Least Squares
Yizhak Ben-Shabat and Stephen Gould.
In Proceedings of the European Conference on Computer Vision (ECCV), 2020.
@inproceedings{BenShabat:ECCV2020,
  author    = {Ben-Shabat, Yizhak and
               Gould, Stephen},
  title     = {{DeepFit}: {3D} Surface Fitting by Neural Network Weighted Least Squares},
  booktitle = {ECCV},
  year      = {2020},
}
[ paper |
preprint |
talk |
code |
bib ]
|
|
Multiview Pedestrian Detection with Feature Perspective Transformation
Yunzhong Hou, Liang Zheng and Stephen Gould.
In Proceedings of the European Conference on Computer Vision (ECCV), 2020.
@inproceedings{Hou:ECCV2020,
  author    = {Hou, Yunzhong and
               Zheng, Liang and
               Gould, Stephen},
  title     = {Multiview Pedestrian Detection with Feature Perspective Transformation},
  booktitle = {ECCV},
  year      = {2020},
}
[ paper |
preprint |
bib ]
|
|
Solving the Blind Perspective-n-Point Problem End-To-End with Robust Differentiable Geometric Optimization
Dylan Campbell, Liu Liu and Stephen Gould.
In Proceedings of the European Conference on Computer Vision (ECCV), 2020.
@inproceedings{Campbell:ECCV2020,
  author    = {Campbell, Dylan and
               Liu, Liu and
               Gould, Stephen},
  title     = {Solving the Blind Perspective-n-Point Problem End-To-End with Robust Differentiable Geometric Optimization},
  booktitle = {ECCV},
  year      = {2020},
}
[ paper |
talk |
preprint |
code |
bib ]
|
|
Spectral-GANs for High-Resolution 3D Point-cloud Generation
Sameera Ramasinghe, Salman Khan, Nick Barnes and Stephen Gould.
In International Conference on Intelligent Robots and Systems (IROS), 2020.
@inproceedings{Ramasinghe:IROS2020,
  author    = {Ramasinghe, Sameera and
               Khan, Salman and
               Barnes, Nick and
               Gould, Stephen},
  title     = {{Spectral-GANs} for High-Resolution {3D} Point-cloud Generation},
  booktitle = {IROS},
  year      = {2020},
}
[ paper |
preprint |
bib ]
|
|
Inferring Temporal Compositions of Actions Using Probabilistic Automata
Rodrigo Santa Cruz, Dylan Campbell, Anoop Cherian, Basura Fernando and Stephen Gould.
In Workshop on Compositionality in Computer Vision at CVPR, 2020.
@inproceedings{SantaCruz:CVPRW2020,
  author    = {Santa Cruz, Rodrigo and
               Campbell, Dylan and
               Cherian, Anoop and
               Fernando, Basura and
               Gould, Stephen},
  title     = {Inferring Temporal Compositions of Actions Using Probabilistic Automata},
  booktitle = {CVPR Workshop on Compositionality in Computer Vision},
  year      = {2020},
}
[ paper |
preprint |
bib ]
|
|
Enhanced Light-Matter Interactions in Dielectric Nanostructures via Machine Learning Approach
Lei Xu, Mohsen Rahmani, Yixuan Ma, Daria A. Smirnova, Khosro Zangeneh Kamali, Fu Deng, Yan Kei Chiang, Lujun Huang, Haoyang Zhang, Stephen Gould, Dragomir N. Neshev and Andrey E. Miroshnichenko.
In Advanced Photonics, 2020.
@article{Xu:AdvPho2020,
  author  = {Xu, Lei and
             Rahmani, Mohsen and
             Ma, Yixuan and
             Smirnova, Daria A. and
             Kamali, Khosro Zangeneh and
             Deng, Fu and
             Chiang, Yan Kei and
             Huang, Lujun and
             Zhang, Haoyang and
             Gould, Stephen and
             Neshev, Dragomir N. and
             Miroshnichenko, Andrey E.},
  title   = {Enhanced Light-Matter Interactions in Dielectric Nanostructures via Machine Learning Approach},
  journal = {Advanced Photonics},
  year    = {2020},
}
[ paper |
preprint |
bib ]
|
|
A Stochastic Conditioning Scheme for Diverse Human Motion Prediction
Sadegh Aliakbarian, Fatemeh Saleh, Mathieu Salzmann, Lars Petersson, Stephen Gould and Amir Habibian.
In IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2020.
@inproceedings{Aliakbarian:CVPR2020,
  author    = {Aliakbarian, Sadegh and
               Saleh, Fatemeh and
               Salzmann, Mathieu and
               Petersson, Lars and
               Gould, Stephen and
               Habibian, Amir},
  title     = {A Stochastic Conditioning Scheme for Diverse Human Motion Prediction},
  booktitle = {CVPR},
  year      = {2020},
}
[ paper |
code |
bib ]
|
|
Learning to Structure an Image with Few Colors
Yunzhong Hou, Liang Zheng and Stephen Gould.
In IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2020.
@inproceedings{Hou:CVPR2020,
  author    = {Hou, Yunzhong and
               Zheng, Liang and
               Gould, Stephen},
  title     = {Learning to Structure an Image with Few Colors},
  booktitle = {CVPR},
  year      = {2020},
}
[ paper |
preprint |
bib ]
|
|
A Signal Propagation Perspective for Pruning Neural Networks at Initialization
Namhoon Lee, Thalaiyasingam Ajanthan, Stephen Gould and Philip H. S. Torr.
In International Conference on Learning Representations (ICLR), 2020.
@inproceedings{Lee:ICLR2020,
  author    = {Lee, Namhoon and
               Ajanthan, Thalaiyasingam and
               Gould, Stephen and
               Torr, Philip H. S.},
  title     = {A Signal Propagation Perspective for Pruning Neural Networks at Initialization},
  booktitle = {ICLR},
  year      = {2020},
}
[ paper and talk |
preprint |
bib ]
|
|
Representation Learning on Unit Ball with 3D Roto-translational Equivariance
Sameera Ramasinghe, Salman Khan, Stephen Gould and Nick Barnes.
In International Journal of Computer Vision (IJCV), 2020.
@article{Ramasinghe:IJCV2020,
  author  = {Ramasinghe, Sameera and
             Khan, Salman and
             Gould, Stephen and
             Barnes, Nick},
  title   = {Representation Learning on Unit Ball with {3D} Roto-translational Equivariance},
  journal = {IJCV},
  year    = {2020},
}
[ paper |
preprint |
bib ]
|
|
Proposal-free Temporal Moment Localization of a Natural-language Query in Video using Guided Attention
Cristian Rodriguez Opazo, Edison Marrese-Taylor, Fatemeh Sadat Saleh, Hongdong Li and Stephen Gould.
In IEEE Winter Conference on Applications of Computer Vision (WACV), 2020.
@inproceedings{Opazo:WACV2020,
  author    = {Opazo, Cristian Rodriguez and
               Marrese-Taylor, Edison and
               Saleh, Fatemeh Sadat and
               Li, Hongdong and
               Gould, Stephen},
  title     = {Proposal-free Temporal Moment Localization of a Natural-language Query in Video using Guided Attention},
  booktitle = {WACV},
  year      = {2020},
}
[ paper |
arXiv |
bib ]
|
|
Blended Convolution and Synthesis for Efficient Discrimination of 3D Shapes
Sameera Ramasinghe, Salman Khan, Nick Barnes and Stephen Gould.
In IEEE Winter Conference on Applications of Computer Vision (WACV), 2020.
@inproceedings{Ramasinghe:WACV2020,
  author    = {Ramasinghe, Sameera and
               Khan, Salman and
               Barnes, Nick and
               Gould, Stephen},
  title     = {Blended Convolution and Synthesis for Efficient Discrimination of {3D} Shapes},
  booktitle = {WACV},
  year      = {2020},
}
[ paper |
bib ]
|
|
Learning to Find Common Objects Across Image Collections
Amirreza Shaban, Amir Rahimi, Shray Bansal, Stephen Gould, Byron Boots and Richard Hartley.
In IEEE International Conference on Computer Vision (ICCV), 2019.
@inproceedings{Shaban:ICCV2019,
  author    = {Shaban, Amirreza and
               Rahimi, Amir and
               Bansal, Shray and
               Gould, Stephen and
               Boots, Byron and
               Hartley, Richard},
  title     = {Learning to Find Common Objects Across Image Collections},
  booktitle = {ICCV},
  year      = {2019},
}
[ paper |
code |
bib ]
|
|
The Alignment of the Spheres: Globally-Optimal Spherical Mixture Alignment for Camera Pose Estimation
Dylan Campbell, Lars Petersson, Laurent Kneip, Hongdong Li and Stephen Gould.
In IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2019.
@inproceedings{Campbell:CVPR2019,
  author    = {Campbell, Dylan and
               Petersson, Lars and
               Kneip, Laurent and
               Li, Hongdong and
               Gould, Stephen},
  title     = {The Alignment of the Spheres: Globally-Optimal Spherical Mixture Alignment for Camera Pose Estimation},
  booktitle = {CVPR},
  year      = {2019},
}
[ paper |
arXiv |
bib ]
|
|
Visual Permutation Learning
Rodrigo Santa Cruz, Basura Fernando, Anoop Cherian and Stephen Gould.
In IEEE Transactions on Pattern Analysis and Machine Intelligence (PAMI), 2018.
@article{SantaCruz:PAMI2018,
  author  = {Santa Cruz, Rodrigo and
             Fernando, Basura and
             Cherian, Anoop and
             Gould, Stephen},
  title   = {Visual Permutation Learning},
  journal = {PAMI},
  year    = {2018},
}
[ paper |
preprint |
bib ]
|
|
Partially-Supervised Image Captioning
Peter Anderson, Stephen Gould and Mark Johnson.
In Advances in Neural Information Processing Systems (NeurIPS), 2018.
@inproceedings{Anderson:NeurIPS2018,
  author    = {Anderson, Peter and
               Gould, Stephen and
               Johnson, Mark},
  title     = {Partially-Supervised Image Captioning},
  booktitle = {NeurIPS},
  year      = {2018},
}
[ pdf |
arXiv |
bib ]
|
|
Second-order Temporal Pooling for Action Recognition
Anoop Cherian and Stephen Gould.
In International Journal of Computer Vision (IJCV), 2018.
@article{Cherian:IJCV2018,
  author  = {Cherian, Anoop and
             Gould, Stephen},
  title   = {Second-order Temporal Pooling for Action Recognition},
  journal = {IJCV},
  year    = {2018},
}
[ paper |
preprint |
bib ]
|
|
Non-Linear Temporal Subspace Representations for Activity Recognition
Anoop Cherian, Suvrit Sra, Stephen Gould and Richard Hartley.
In IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2018.
@inproceedings{Cherian:CVPR2018,
  author    = {Cherian, Anoop and
               Sra, Suvrit and
               Gould, Stephen and
               Hartley, Richard},
  title     = {Non-Linear Temporal Subspace Representations for Activity Recognition},
  booktitle = {CVPR},
  year      = {2018},
}
[ pdf |
bib ]
|
|
Bottom-Up and Top-Down Attention for Image Captioning and Visual Question Answering
Peter Anderson, Xiaodong He, Chris Buehler, Damien Teney, Mark Johnson, Stephen Gould and Lei Zhang.
In IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2018.
@inproceedings{Anderson:CVPR2018a,
  author    = {Anderson, Peter and
               He, Xiaodong and
               Buehler, Chris and
               Teney, Damien and
               Johnson, Mark and
               Gould, Stephen and
               Zhang, Lei},
  title     = {Bottom-Up and Top-Down Attention for Image Captioning and Visual Question Answering},
  booktitle = {CVPR},
  year      = {2018},
}
[ pdf |
arXiv |
bib ]
|
|
Vision-and-Language Navigation: Interpreting Visually-grounded Navigation Instructions in Real Environments
Peter Anderson, Qi Wu, Damien Teney, Jake Bruce, Mark Johnson, Niko Sünderhauf, Ian Reid, Stephen Gould and Anton van den Hengel.
In IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2018.
@inproceedings{Anderson:CVPR2018b,
  author    = {Anderson, Peter and
               Wu, Qi and
               Teney, Damien and
               Bruce, Jake and
               Johnson, Mark and
               S{\"u}nderhauf, Niko and
               Reid, Ian and
               Gould, Stephen and
               van den Hengel, Anton},
  title     = {Vision-and-Language Navigation: Interpreting Visually-grounded Navigation Instructions in Real Environments},
  booktitle = {CVPR},
  year      = {2018},
}
[ pdf |
arXiv |
project |
bib ]
|
|
Video Representation Learning Using Discriminative Pooling
Jue Wang, Anoop Cherian, Fatih Porikli and Stephen Gould.
In IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2018.
@inproceedings{Wang:CVPR2018,
  author    = {Wang, Jue and
               Cherian, Anoop and
               Porikli, Fatih and
               Gould, Stephen},
  title     = {Video Representation Learning Using Discriminative Pooling},
  booktitle = {CVPR},
  year      = {2018},
}
[ pdf |
arXiv |
bib ]
|
|
Neural Algebra of Classifiers
Rodrigo Santa Cruz, Basura Fernando, Anoop Cherian and Stephen Gould.
In IEEE Winter Conference on Applications of Computer Vision (WACV), 2018.
@inproceedings{SantaCruz:WACV2018,
  author    = {Santa Cruz, Rodrigo and
               Fernando, Basura and
               Cherian, Anoop and
               Gould, Stephen},
  title     = {Neural Algebra of Classifiers},
  booktitle = {WACV},
  year      = {2018},
}
[ pdf |
code |
bib ]
|
|
Human Pose Forecasting via Deep Markov Models
Sam Toyer, Anoop Cherian, Tengda (Mike) Han and Stephen Gould.
In International Conference on Digital Image Computing: Techniques and Applications (DICTA), 2017.
@inproceedings{Toyer:DICTA2017,
  author    = {Toyer, Sam and
               Cherian, Anoop and
               Han, Tengda and
               Gould, Stephen},
  title     = {Human Pose Forecasting via Deep {Markov} Models},
  booktitle = {DICTA},
  year      = {2017},
}
[ arXiv |
Ikea dataset |
bib ]
|
|
Guided Open Vocabulary Image Captioning with Constrained Beam Search
Peter Anderson, Basura Fernando, Mark Johnson and Stephen Gould.
In Conference on Empirical Methods in Natural Language Processing (EMNLP), 2017.
@inproceedings{Anderson:EMNLP2017,
  author    = {Anderson, Peter and
               Fernando, Basura and
               Johnson, Mark and
               Gould, Stephen},
  title     = {Guided Open Vocabulary Image Captioning with Constrained Beam Search},
  booktitle = {EMNLP},
  year      = {2017},
}
[ pdf |
bib ]
|
|
Incorporating Network Built-in Priors in Weakly-supervised Semantic Segmentation
Fatemeh Sadat Saleh, Mohammad Sadegh Aliakbarian, Mathieu Salzmann, Lars Petersson, Jose M. Alvarez and Stephen Gould.
In IEEE Transactions on Pattern Analysis and Machine Intelligence (PAMI), 2017.
@article{Saleh:PAMI2017,
  author  = {Saleh, Fatemeh Sadat and
             Aliakbarian, Mohammad Sadegh and
             Salzmann, Mathieu and
             Petersson, Lars and
             Alvarez, Jose M. and
             Gould, Stephen},
  title   = {Incorporating Network Built-in Priors in Weakly-supervised Semantic Segmentation},
  journal = {PAMI},
  year    = {2017},
}
[ paper |
preprint |
bib ]
|
|
Discriminatively Learned Hierarchical Rank Pooling Networks
Basura Fernando and Stephen Gould.
In International Journal of Computer Vision (IJCV), 2017.
@article{Fernando:IJCV2017,
  author  = {Fernando, Basura and
             Gould, Stephen},
  title   = {Discriminatively Learned Hierarchical Rank Pooling Networks},
  journal = {IJCV},
  year    = {2017},
}
[ paper |
bib ]
|
|
Generalized Rank Pooling for Action Recognition
Anoop Cherian, Basura Fernando, Mehrtash Harandi and Stephen Gould.
In IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2017.
@inproceedings{Cherian:CVPR2017,
  author    = {Cherian, Anoop and
               Fernando, Basura and
               Harandi, Mehrtash and
               Gould, Stephen},
  title     = {Generalized Rank Pooling for Action Recognition},
  booktitle = {CVPR},
  year      = {2017},
}
[ pdf |
preprint |
bib ]
|
|
DeepPermNet: Visual Permutation Learning
Rodrigo Santa Cruz, Basura Fernando, Anoop Cherian and Stephen Gould.
In IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2017.
@inproceedings{SantaCruz:CVPR2017,
  author    = {Santa Cruz, Rodrigo and
               Fernando, Basura and
               Cherian, Anoop and
               Gould, Stephen},
  title     = {{DeepPermNet}: Visual Permutation Learning},
  booktitle = {CVPR},
  year      = {2017},
}
[ pdf |
preprint |
code |
bib ]
|
|
Self-Supervised Video Representation Learning With Odd-One-Out Networks
Basura Fernando, Hakan Bilen, Efstratios Gavves and Stephen Gould.
In IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2017.
@inproceedings{Fernando:CVPR2017,
  author    = {Fernando, Basura and
               Bilen, Hakan and
               Gavves, Efstratios and
               Gould, Stephen},
  title     = {Self-Supervised Video Representation Learning With Odd-One-Out Networks},
  booktitle = {CVPR},
  year      = {2017},
}
[ pdf |
preprint |
bib ]
|
|
Higher-order Pooling of CNN Features via Kernel Linearization for Action Recognition
Anoop Cherian, Piotr Koniusz and Stephen Gould.
In IEEE Winter Conference on Applications of Computer Vision (WACV), 2017.
@inproceedings{Cherian:WACV2017,
  author    = {Cherian, Anoop and
               Koniusz, Piotr and
               Gould, Stephen},
  title     = {Higher-order Pooling of {CNN} Features via Kernel Linearization for Action Recognition},
  booktitle = {WACV},
  year      = {2017},
}
[ preprint |
code |
bib ]
|
|
Depth Dropout: Efficient Training of Residual Convolutional Neural Networks
Jian Guo and Stephen Gould.
In Digital Image Computing: Techniques and Applications (DICTA), 2016.
@inproceedings{Guo:DICTA2016,
  author    = {Guo, Jian and
               Gould, Stephen},
  title     = {Depth Dropout: Efficient Training of Residual Convolutional Neural Networks},
  booktitle = {DICTA},
  year      = {2016},
}
[ pdf |
bib ]
|
|
SPICE: Semantic Propositional Image Caption Evaluation
Peter Anderson, Basura Fernando, Mark Johnson and Stephen Gould.
In Proceedings of the European Conference on Computer Vision (ECCV), 2016.
@inproceedings{Anderson:ECCV2016,
  author    = {Anderson, Peter and
               Fernando, Basura and
               Johnson, Mark and
               Gould, Stephen},
  title     = {{SPICE}: Semantic Propositional Image Caption Evaluation},
  booktitle = {ECCV},
  year      = {2016},
}
[ pdf |
project |
code |
bib ]
|
|
Built-in Foreground/Background Prior for Weakly-Supervised Semantic Segmentation
Fatemehsadat Saleh, Mohammad Sadegh Ali Akbarian, Mathieu Salzmann, Lars Petersson, Stephen Gould and Jose M. Alvarez.
In Proceedings of the European Conference on Computer Vision (ECCV), 2016.
@inproceedings{Saleh:ECCV2016,
  author    = {Saleh, Fatemehsadat and
               Akbarian, Mohammad Sadegh Ali and
               Salzmann, Mathieu and
               Petersson, Lars and
               Gould, Stephen and
               Alvarez, Jose M.},
  title     = {Built-in Foreground/Background Prior for Weakly-Supervised Semantic Segmentation},
  booktitle = {ECCV},
  year      = {2016},
}
[ pdf |
arXiv |
bib ]
|
|
On Differentiating Parameterized Argmin and Argmax Problems with Application to Bi-level Optimization
Stephen Gould, Basura Fernando, Anoop Cherian, Peter Anderson, Rodrigo Santa Cruz and Edison Guo.
Technical Report (available online arXiv:1607.05447), 2016.
@techreport{Gould:TR2016,
  author        = {Gould, Stephen and
                   Fernando, Basura and
                   Cherian, Anoop and
                   Anderson, Peter and
                   Santa Cruz, Rodrigo and
                   Guo, Edison},
  title         = {On Differentiating Parameterized Argmin and Argmax Problems with Application to Bi-level Optimization},
  eprint        = {1607.05447},
  archiveprefix = {arXiv},
  month         = jul,
  year          = {2016},
}
[ pdf |
arXiv |
code |
bib ]
|
|
Deep Convolutional Neural Networks for Human Embryonic Cell Counting
Aisha Khan, Stephen Gould and Mathieu Salzmann.
In Workshop on Bioimage Computing (BIC) at ECCV, 2016.
@inproceedings{Khan:BIC2016,
  author    = {Khan, Aisha and
               Gould, Stephen and
               Salzmann, Mathieu},
  title     = {Deep Convolutional Neural Networks for Human Embryonic Cell Counting},
  booktitle = {Bioimage Computing at ECCV},
  year      = {2016},
}
[ pdf |
bib ]
|
|
Learning End-to-end Video Classification with Rank-Pooling
Basura Fernando and Stephen Gould.
In Proceedings of the International Conference on Machine Learning (ICML), 2016.
@inproceedings{Fernando:ICML2016,
  author    = {Fernando, Basura and
               Gould, Stephen},
  title     = {Learning End-to-end Video Classification with Rank-Pooling},
  booktitle = {ICML},
  year      = {2016},
}
[ pdf |
bib ]
|
|
Discriminative Hierarchical Rank Pooling for Activity Recognition
Basura Fernando, Peter Anderson, Marcus Hutter and Stephen Gould.
In IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2016.
@inproceedings{Fernando:CVPR2016,
  author    = {Fernando, Basura and
               Anderson, Peter and
               Hutter, Marcus and
               Gould, Stephen},
  title     = {Discriminative Hierarchical Rank Pooling for Activity Recognition},
  booktitle = {CVPR},
  year      = {2016},
}
[ pdf |
code |
bib ]
|
|
Dynamic Image Networks for Action Recognition
Hakan Bilen, Basura Fernando, Stratis Gavves, Andrea Vedaldi and Stephen Gould.
In IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2016.
@inproceedings{Bilen:CVPR2016,
  author    = {Bilen, Hakan and
               Fernando, Basura and
               Gavves, Stratis and
               Vedaldi, Andrea and
               Gould, Stephen},
  title     = {Dynamic Image Networks for Action Recognition},
  booktitle = {CVPR},
  year      = {2016},
}
[ pdf |
code |
bib ]
|
|
Segmentation of Developing Human Embryo in Time-lapse Microscopy
Aisha Khan, Stephen Gould and Mathieu Salzmann.
In IEEE International Symposium on Biomedical Imaging (ISBI), 2016.
@inproceedings{Khan:ISBI2016,
  author    = {Khan, Aisha and
               Gould, Stephen and
               Salzmann, Mathieu},
  title     = {Segmentation of Developing Human Embryo in Time-lapse Microscopy},
  booktitle = {ISBI},
  year      = {2016},
}
[ pdf |
bib ]
|
|
Hierarchical Higher-order Regression Forest Fields: An Application to 3D Indoor Scene Labelling
Trung T. Pham, Ian Reid, Yasir Latif and Stephen Gould.
In IEEE International Conference on Computer Vision (ICCV), 2015.
@inproceedings{Pham:ICCV2015,
  author    = {Pham, Trung T. and
               Reid, Ian and
               Latif, Yasir and
               Gould, Stephen},
  title     = {Hierarchical Higher-order Regression Forest Fields: An Application to {3D} Indoor Scene Labelling},
  booktitle = {ICCV},
  year      = {2015},
}
[ pdf |
bib ]
|
|
Detecting Abnormal Cell Division Patterns in Early Stage Human Embryo Development
Aisha Khan, Stephen Gould and Mathieu Salzmann.
In 6th International Workshop on Machine Learning in Medical Imaging (MLMI) at MICCAI, 2015.
@inproceedings{Khan:MLMI2015,
  author    = {Khan, Aisha and
               Gould, Stephen and
               Salzmann, Mathieu},
  title     = {Detecting Abnormal Cell Division Patterns in Early Stage Human Embryo Development},
  booktitle = {6th International Workshop on Machine Learning in Medical Imaging (MLMI)},
  year      = {2015},
}
[ pdf |
bib ]
|
|
Automated Monitoring of Human Embryonic Cells up to the 5-cell Stage in Time-lapse Microscopy Images
Aisha Khan, Stephen Gould and Mathieu Salzmann.
In IEEE International Symposium on Biomedical Imaging (ISBI), 2015.
@inproceedings{Khan:ISBI2015,
  author    = {Khan, Aisha and
               Gould, Stephen and
               Salzmann, Mathieu},
  title     = {Automated Monitoring of Human Embryonic Cells up to the 5-cell Stage in Time-lapse Microscopy Images},
  booktitle = {ISBI},
  year      = {2015},
}
[ pdf |
bib ]
|
|
Multi-target Tracking with Time-varying Clutter Rate and Detection Profile: Application to Time-lapse Cell Microscopy Sequences
Seyed Hamid Rezatofighi, Stephen Gould, Ba-Tuong Vo, Ba-Ngu Vo, Katarina Mele and Richard Hartley.
In IEEE Transactions on Medical Imaging (TMI), 2015.
@article{Rezatofighi:TMI2015,
  author  = {Rezatofighi, Seyed Hamid and
             Gould, Stephen and
             Vo, Ba-Tuong and
             Vo, Ba-Ngu and
             Mele, Katarina and
             Hartley, Richard},
  title   = {Multi-target Tracking with Time-varying Clutter Rate and Detection Profile: Application to Time-lapse Cell Microscopy Sequences},
  journal = {IEEE Trans. on Medical Imaging},
  volume  = {34},
  month   = jun,
  year    = {2015},
}
[ pdf |
bib ]
|
|
Multi-class Semantic Video Segmentation with Exemplar-based Object Reasoning
Buyu Liu, Stephen Gould and Xuming He.
In IEEE Winter Conference on Applications of Computer Vision (WACV),
2015.
@inproceedings{Liu:WACV2015,
  author    = {Liu, Buyu and
               Gould, Stephen and
               He, Xuming},
  title     = {Multi-class Semantic Video Segmentation with Exemplar-based Object Reasoning},
  booktitle = {WACV},
  year      = {2015},
}
[ pdf |
bib ]
|
|
A Linear Chain Markov Model for Detection and Localization of Cells in Early Stage Embryo Development
Aisha Khan, Stephen Gould and Mathieu Salzmann.
In IEEE Winter Conference on Applications of Computer Vision (WACV),
2015.
@inproceedings{Khan:WACV2015,
  author    = {Khan, Aisha and
               Gould, Stephen and
               Salzmann, Mathieu},
  title     = {A Linear Chain {Markov} Model for Detection and Localization of Cells in Early Stage Embryo Development},
  booktitle = {WACV},
  year      = {2015},
}
[ pdf |
bib ]
|
|
Learning Weighted Lower Linear Envelope Potentials in Binary Markov Random Fields
Stephen Gould.
In IEEE Transactions on Pattern Analysis and Machine Intelligence (PAMI),
2015.
@article{Gould:PAMI2015,
  author  = {Gould, Stephen},
  title   = {Learning Weighted Lower Linear Envelope Potentials in Binary {Markov} Random Fields},
  journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence (PAMI)},
  volume  = {37},
  number  = {7},
  pages   = {1336--1346},
  year    = {2015},
}
[ pdf |
code |
bib ]
|
|
Scene Understanding by Labeling Pixels
Stephen Gould and Xuming He.
In Communications of the ACM (CACM),
2014.
@article{Gould:CACM2014,
  author  = {Gould, Stephen and
             He, Xuming},
  title   = {Scene Understanding by Labeling Pixels},
  journal = {Communications of the ACM (CACM)},
  volume  = {57},
  number  = {11},
  pages   = {68--77},
  month   = nov,
  year    = {2014},
}
[ pdf |
link |
video |
bib ]
|
|
Determining Interacting Objects in Human-Centric Activities via Qualitative Spatio-temporal Reasoning
Hajar Sadeghi Sokeh, Stephen Gould and Jochen Renz.
In Proceedings of the Asian Conference on Computer Vision (ACCV),
2014.
@inproceedings{Sokeh:ACCV2014,
  author    = {Sokeh, Hajar Sadeghi and
               Gould, Stephen and
               Renz, Jochen},
  title     = {Determining Interacting Objects in Human-Centric Activities via Qualitative Spatio-temporal Reasoning},
  booktitle = {ACCV},
  year      = {2014},
}
[ pdf |
bib ]
|
|
Superpixel Graph Label Transfer with Learned Distance Metric
Stephen Gould, Jiecheng Zhao, Xuming He and Yuhang Zhang.
In Proceedings of the European Conference on Computer Vision (ECCV),
2014.
@inproceedings{Gould:ECCV2014,
  author    = {Gould, Stephen and
               Zhao, Jiecheng and
               He, Xuming and
               Zhang, Yuhang},
  title     = {Superpixel Graph Label Transfer with Learned Distance Metric},
  booktitle = {ECCV},
  year      = {2014},
}
[ pdf |
code |
bib ]
|
|
An Exemplar-based CRF for Multi-instance Object Segmentation
Xuming He and Stephen Gould.
In IEEE Conference on Computer Vision and Pattern Recognition (CVPR),
2014.
@inproceedings{He:CVPR2014,
  author    = {He, Xuming and
               Gould, Stephen},
  title     = {An Exemplar-based {CRF} for Multi-instance Object Segmentation},
  booktitle = {CVPR},
  year      = {2014},
}
[ pdf |
bib ]
|
|
Joint Semantic and Geometric Segmentation of Videos with a Stage Model
Buyu Liu, Xuming He and Stephen Gould.
In IEEE Winter Conference on Applications of Computer Vision (WACV),
2014.
@inproceedings{Liu:WACV2014,
  author    = {Liu, Buyu and
               He, Xuming and
               Gould, Stephen},
  title     = {Joint Semantic and Geometric Segmentation of Videos with a Stage Model},
  booktitle = {WACV},
  year      = {2014},
}
[ pdf |
bib ]
|
|
A Unified Graphical Models Framework for Automated Mitosis Detection in Human Embryos
Farshid Moussavi, Wang Yu, Peter Lorenzen, Jonathan Oakley, Daniel Russakoff and Stephen Gould.
In IEEE Transactions on Medical Imaging (TMI), 2014.
A shorter version of this paper appeared in IEEE International Symposium on Biomedical Imaging (ISBI), 2014.
@inproceedings{Moussavi:ISBI2014,
  author    = {Moussavi, Farshid and
               Yu, Wang and
               Lorenzen, Peter and
               Oakley, Jonathan and
               Russakoff, Daniel and
               Gould, Stephen},
  title     = {A Unified Graphical Models Framework for Automated Human Embryo Tracking in Time Lapse Microscopy},
  booktitle = {ISBI},
  year      = {2014},
}
@article{Moussavi:TMI2014,
  author  = {Moussavi, Farshid and
             Yu, Wang and
             Lorenzen, Peter and
             Oakley, Jonathan and
             Russakoff, Daniel and
             Gould, Stephen},
  title   = {A Unified Graphical Models Framework for Automated Mitosis Detection in Human Embryos},
  journal = {IEEE Trans. on Medical Imaging},
  volume  = {33},
  pages   = {1551--1562},
  year    = {2014},
}
[ pdf |
bib ]
|
|
Efficient Extraction and Representation of Spatial Information from Video Data
Hajar Sadeghi Sokeh, Stephen Gould and Jochen Renz.
In Proceedings of the Twenty Third International Joint Conference on Artificial Intelligence (IJCAI),
2013.
@inproceedings{Sokeh:IJCAI2013,
  author    = {Sokeh, Hajar Sadeghi and
               Gould, Stephen and
               Renz, Jochen},
  title     = {Efficient Extraction and Representation of Spatial Information from Video Data},
  booktitle = {IJCAI},
  year      = {2013},
}
[ pdf |
bib ]
|
|
Discriminative Learning with Latent Variables for Cluttered Indoor Scene Understanding
Huayan Wang, Stephen Gould and Daphne Koller.
In Communications of the ACM, Research Highlights,
2013.
An earlier version of this work appeared in Proceedings of the European Conference on Computer Vision (ECCV),
2010.
@article{Wang:CACM2013,
  author  = {Wang, Huayan and
             Gould, Stephen and
             Koller, Daphne},
  title   = {Discriminative Learning with Latent Variables for Cluttered Indoor Scene Understanding},
  journal = {Communications of the ACM, Research Highlights},
  volume  = {56},
  pages   = {92--99},
  month   = apr,
  year    = {2013},
}
@inproceedings{Wang:ECCV2010,
  author    = {Wang, Huayan and
               Gould, Stephen and
               Koller, Daphne},
  title     = {Discriminative Learning with Latent Variables for Cluttered Indoor Scene Understanding},
  booktitle = {ECCV},
  year      = {2010},
}
[ pdf (cacm) |
pdf (eccv) |
link |
bib ]
|
|
A Multiple Model Probability Hypothesis Density Tracker for Time-lapse
Cell Microscopy Sequences
Seyed Hamid Rezatofighi, Stephen Gould, Ba-Ngu Vo, Katarina Mele, William E. Hughes and Richard Hartley.
In International Conference on Information Processing in Medical Imaging (IPMI),
2013.
@inproceedings{Rezatofighi:IPMI2013,
  author    = {Rezatofighi, Seyed Hamid and
               Gould, Stephen and
               Vo, Ba-Ngu and
               Mele, Katarina and
               Hughes, William E. and
               Hartley, Richard},
  title     = {A Multiple Model Probability Hypothesis Density Tracker for Time-lapse Cell Microscopy Sequences},
  booktitle = {IPMI},
  year      = {2013},
}
[ pdf |
bib ]
|
|
A Framework for Generating Realistic Synthetic Sequences of Total
Internal Reflection Fluorescence Microscopy Images
Seyed Hamid Rezatofighi, William T. E. Pitkeathly, Stephen Gould, Richard Hartley, Katarina Mele, William E. Hughes and James G. Burchfield.
In Proceedings of the International Symposium on Biomedical Imaging (ISBI),
2013.
@inproceedings{Rezatofighi:ISBI2013,
  author    = {Rezatofighi, Seyed Hamid and
               Pitkeathly, William T. E. and
               Gould, Stephen and
               Hartley, Richard and
               Mele, Katarina and
               Hughes, William E. and
               Burchfield, James G.},
  title     = {A Framework for Generating Realistic Synthetic Sequences of Total Internal Reflection Fluorescence Microscopy Images},
  booktitle = {ISBI},
  year      = {2013},
}
[ pdf |
code |
bib ]
|
|
DARWIN: A Framework for Machine Learning and Computer Vision Research and Development
Stephen Gould.
In Journal of Machine Learning Research (JMLR),
2012.
@article{Gould:JMLR2012,
  author  = {Gould, Stephen},
  title   = {{DARWIN}: A Framework for Machine Learning and Computer Vision Research and Development},
  journal = {Journal of Machine Learning Research (JMLR)},
  volume  = {13},
  pages   = {3533--3537},
  month   = dec,
  year    = {2012},
}
[ pdf |
code |
mloss |
bib ]
|
|
Towards Unsupervised Semantic Segmentation of Street Scenes From Motion Cues
Hajar Sadeghi Sokeh and Stephen Gould.
In Proceedings of the International Conference on Image and Vision Computing New Zealand (IVCNZ),
2012.
@inproceedings{Sokeh:IVCNZ2012,
  author    = {Sokeh, Hajar Sadeghi and
               Gould, Stephen},
  title     = {Towards Unsupervised Semantic Segmentation of Street Scenes From Motion Cues},
  booktitle = {IVCNZ},
  year      = {2012},
}
[ pdf |
bib ]
|
|
A Noise Tolerant Watershed Transformation with Viscous Force for Seeded Image Segmentation
Di Yang, Stephen Gould and Marcus Hutter.
In Proceedings of the Asian Conference on Computer Vision (ACCV),
2012.
@inproceedings{Yang:ACCV2012,
  author    = {Yang, Di and
               Gould, Stephen and
               Hutter, Marcus},
  title     = {A Noise Tolerant Watershed Transformation with Viscous Force for Seeded Image Segmentation},
  booktitle = {ACCV},
  year      = {2012},
}
[ pdf |
code |
bib ]
|
|
PatchMatchGraph: Building a Graph of Dense Patch Correspondences for Label Transfer
Stephen Gould and Yuhang Zhang.
In Proceedings of the European Conference on Computer Vision (ECCV),
2012.
@inproceedings{Gould:ECCV2012,
  author    = {Gould, Stephen and
               Zhang, Yuhang},
  title     = {{PatchMatchGraph}: Building a Graph of Dense Patch Correspondences for Label Transfer},
  booktitle = {ECCV},
  year      = {2012},
}
[ pdf |
code |
polo dataset (32MB) |
stanford dataset (15MB) |
bib ]
|
|
On Learning Higher-Order Consistency Potentials for Multi-class Pixel Labeling
Kyoungup Park and Stephen Gould.
In Proceedings of the European Conference on Computer Vision (ECCV),
2012.
@inproceedings{Park:ECCV2012,
  author    = {Park, Kyoungup and
               Gould, Stephen},
  title     = {On Learning Higher-Order Consistency Potentials for Multi-class Pixel Labeling},
  booktitle = {ECCV},
  year      = {2012},
}
[ pdf |
bib ]
|
|
Application of the IMM-JPDA Filter to Multiple Target Tracking in
Total Internal Reflection Fluorescence Microscopy Images
Seyed Hamid Rezatofighi, Stephen Gould, Richard Hartley, Katarina Mele and William E. Hughes.
In Proceedings of the International Conference on Medical Image Computing and Computer Assisted Intervention (MICCAI),
2012.
@inproceedings{Rezatofighi:MICCAI2012,
  author    = {Rezatofighi, Seyed Hamid and
               Gould, Stephen and
               Hartley, Richard and
               Mele, Katarina and
               Hughes, William E.},
  title     = {Application of the {IMM-JPDA} Filter to Multiple Target Tracking in Total Internal Reflection Fluorescence Microscopy Images},
  booktitle = {MICCAI},
  year      = {2012},
}
[ pdf |
bib ]
|
|
Multiclass Pixel Labeling with Non-Local Matching Constraints
Stephen Gould.
In IEEE Conference on Computer Vision and Pattern Recognition (CVPR),
2012.
@inproceedings{Gould:CVPR2012,
  author    = {Gould, Stephen},
  title     = {Multiclass Pixel Labeling with Non-Local Matching Constraints},
  booktitle = {CVPR},
  year      = {2012},
}
[ pdf |
bib ]
|
|
Simultaneous Multi-class Pixel Labeling over Coherent Image Sets
Paul Rivera and Stephen Gould.
In Digital Image Computing: Techniques and Applications (DICTA),
2011.
@inproceedings{Rivera:DICTA2011,
  author    = {Rivera, Paul and
               Gould, Stephen},
  title     = {Simultaneous Multi-class Pixel Labeling over Coherent Image Sets},
  booktitle = {DICTA},
  year      = {2011},
}
[ pdf |
bib ]
|
|
Max-margin Learning for Lower Linear Envelope Potentials in Binary Markov Random Fields
Stephen Gould.
In Proceedings of the International Conference on Machine Learning (ICML),
2011.
@inproceedings{Gould:ICML2011,
  author    = {Gould, Stephen},
  title     = {Max-margin Learning for Lower Linear Envelope Potentials in Binary {Markov} Random Fields},
  booktitle = {ICML},
  year      = {2011},
}
[ pdf |
code |
slides (.pdf) |
bib ]
|
|
A Unified Contour-Pixel Model for Segmentation
Ben Packer, Stephen Gould and Daphne Koller.
In Proceedings of the European Conference on Computer Vision (ECCV),
2010.
@inproceedings{Packer:ECCV2010,
  author    = {Packer, Ben and
               Gould, Stephen and
               Koller, Daphne},
  title     = {A Unified Contour-Pixel Model for Segmentation},
  booktitle = {ECCV},
  year      = {2010},
}
[ pdf |
bib ]
|
|
Probabilistic Models for Region-based Scene Understanding
Stephen Gould.
Ph.D. Thesis, Stanford University,
June 2010.
@phdthesis{Gould:PhD2010,
  author = {Gould, Stephen},
  title  = {Probabilistic Models for Region-based Scene Understanding},
  school = {Stanford University},
  month  = jun,
  year   = {2010},
}
[ pdf |
archive |
bib ]
|
|
Accelerated Dual Decomposition for MAP Inference
Vladimir Jojic, Stephen Gould and Daphne Koller.
In Proceedings of the International Conference on Machine Learning (ICML),
2010.
@inproceedings{Jojic:ICML2010,
  author    = {Jojic, Vladimir and
               Gould, Stephen and
               Koller, Daphne},
  title     = {Accelerated Dual Decomposition for {MAP} Inference},
  booktitle = {ICML},
  year      = {2010},
}
[ pdf |
bib ]
|
|
Single Image Depth Estimation from Predicted Semantic Labels
Beyang Liu, Stephen Gould and Daphne Koller.
In IEEE Conference on Computer Vision and Pattern Recognition (CVPR),
2010.
@inproceedings{Liu:CVPR2010,
  author    = {Liu, Beyang and
               Gould, Stephen and
               Koller, Daphne},
  title     = {Single Image Depth Estimation from Predicted Semantic Labels},
  booktitle = {CVPR},
  year      = {2010},
}
[ pdf |
data (.tar.gz) |
bib ]
|
|
Region-based Segmentation and Object Detection
Stephen Gould, Tianshi Gao and Daphne Koller.
In Advances in Neural Information Processing Systems (NeurIPS),
2009.
@inproceedings{Gould:NeurIPS09,
  author    = {Gould, Stephen and
               Gao, Tianshi and
               Koller, Daphne},
  title     = {Region-based Segmentation and Object Detection},
  booktitle = {NeurIPS},
  year      = {2009},
}
[ pdf |
bib ]
|
|
Decomposing a Scene into Geometric and Semantically Consistent Regions
Stephen Gould, Rick Fulton and Daphne Koller.
In IEEE International Conference on Computer Vision (ICCV),
2009.
@inproceedings{Gould:ICCV09,
  author    = {Gould, Stephen and
               Fulton, Richard and
               Koller, Daphne},
  title     = {Decomposing a Scene into Geometric and Semantically Consistent Regions},
  booktitle = {ICCV},
  year      = {2009},
}
[ pdf |
slides (.pdf) |
inference (.wmv) |
data (.tar.gz) |
bib ]
|
|
Alphabet SOUP: A Framework for Approximate Energy Minimization
Stephen Gould, Fernando Amat and Daphne Koller.
In IEEE Conference on Computer Vision and Pattern Recognition (CVPR),
2009.
@inproceedings{Gould:CVPR09,
  author    = {Gould, Stephen and
               Amat, Fernando and
               Koller, Daphne},
  title     = {Alphabet {SOUP}: A Framework for Approximate Energy Minimization},
  booktitle = {CVPR},
  year      = {2009},
}
[ pdf |
erratum |
poster |
bib ]
|
|
High-Accuracy 3D Sensing for Mobile Manipulation: Improving Object Detection and Door Opening
Morgan Quigley, Siddharth Batra, Stephen Gould, Ellen Klingbeil, Quoc V. Le, Ashley Wellman and Andrew Y. Ng.
In IEEE International Conference on Robotics and Automation (ICRA),
2009.
@inproceedings{Quigley:ICRA09,
  author    = {Quigley, Morgan and
               Batra, Siddharth and
               Gould, Stephen and
               Klingbeil, Ellen and
               Le, Quoc V. and
               Wellman, Ashley and
               Ng, Andrew Y.},
  title     = {High-Accuracy {3D} Sensing for Mobile Manipulation: Improving Object Detection and Door Opening},
  booktitle = {ICRA},
  year      = {2009},
}
[ pdf |
videos |
bib ]
|
|
Cascaded Classification Models: Combining Models for Holistic Scene Understanding
Geremy Heitz, Stephen Gould, Ashutosh Saxena and Daphne Koller.
In Advances in Neural Information Processing Systems (NeurIPS),
2008.
@inproceedings{Heitz:NeurIPS08,
  author    = {Heitz, Geremy and Gould, Stephen and Saxena, Ashutosh and Koller, Daphne},
  title     = {Cascaded Classification Models: Combining Models for Holistic Scene Understanding},
  booktitle = {NeurIPS},
  year      = {2008},
}
[ pdf |
bib ]
|
|
Learning Bounded Treewidth Bayesian Networks
Gal Elidan and Stephen Gould.
In Advances in Neural Information Processing Systems (NeurIPS),
2008.
A longer version of this paper also appears
in Journal of Machine Learning Research (JMLR),
2008.
@inproceedings{Elidan:NeurIPS08,
author = {Gal Elidan and
Stephen Gould},
title = {Learning Bounded Treewidth {Bayesian} Networks},
booktitle = {NeurIPS},
year = {2008}
}
@article{Elidan:JMLR08,
author = {Gal Elidan and
Stephen Gould},
title = {Learning Bounded Treewidth {Bayesian} Networks},
journal = {Journal of Machine Learning Research},
year = 2008,
volume = 9,
month = dec,
pages = {2699--2731},
}
[ pdf (nips) |
pdf (jmlr) |
bib ]
|
|
Integrating Visual and Range Data for Robotic Object Detection
Stephen Gould, Paul Baumstarck, Morgan Quigley, Andrew Y. Ng and Daphne Koller.
In ECCV Workshop on Multi-camera and Multi-modal Sensor Fusion Algorithms and Applications (M2SFA2),
2008.
@inproceedings{Gould:M2SFA208,
  author    = {Gould, Stephen and Baumstarck, Paul and Quigley, Morgan and Ng, Andrew Y. and Koller, Daphne},
  title     = {Integrating Visual and Range Data for Robotic Object Detection},
  booktitle = {ECCV Workshop on Multi-camera and Multi-modal Sensor Fusion Algorithms and Applications (M2SFA2)},
  year      = {2008},
}
[ pdf |
bib ]
|
|
Projected Subgradient Methods for Learning Sparse Gaussians
John Duchi, Stephen Gould and Daphne Koller.
In Proceedings of the Twenty-Fourth Conference on Uncertainty in Artificial Intelligence (UAI),
2008.
@inproceedings{Duchi:UAI08,
author = {John C. Duchi and
Stephen Gould and
Daphne Koller},
title = {Projected Subgradient Methods for Learning Sparse {Gaussians}},
booktitle = {UAI},
year = {2008},
pages = {145--152}
}
[ pdf |
bib ]
|
|
Multi-Class Segmentation with Relative Location Prior
Stephen Gould, Jim Rodgers, David Cohen, Gal Elidan and Daphne Koller.
In International Journal of Computer Vision (IJCV),
2008.
@article{Gould:IJCV08,
author = {Stephen Gould and
Jim Rodgers and
David Cohen and
Gal Elidan and
Daphne Koller},
title = {Multi-Class Segmentation with Relative Location Prior},
journal = {International Journal of Computer Vision},
volume = {80},
number = {3},
year = {2008},
pages = {300--316}
}
[ pdf |
bib ]
|
|
STAIR: The STanford Artificial Intelligence Robot Project
Andrew Y. Ng, Stephen Gould, Morgan Quigley, Ashutosh Saxena and Eric Berger.
In Learning Workshop, Snowbird,
2008.
[ project ]
|
|
Peripheral-Foveal Vision for Real-time Object Recognition and Tracking in Video
Stephen Gould, Joakim Arfvidsson, Adrian Kaehler, Benjamin Sapp,
Marius Meissner, Gary Bradski, Paul Baumstarck, Sukwon Chung and Andrew Y. Ng.
In Proceedings of the Twentieth International Joint Conference on Artificial Intelligence (IJCAI),
2007.
@inproceedings{Gould:IJCAI07,
author = {Stephen Gould and
Joakim Arfvidsson and
Adrian Kaehler and
Benjamin Sapp and
Marius Messner and
Gary R. Bradski and
Paul Baumstarck and
Sukwon Chung and
Andrew Y. Ng},
title = {Peripheral-Foveal Vision for Real-time Object Recognition and Tracking in Video},
booktitle = {IJCAI},
year = {2007},
pages = {2115--2121},
url = {http://www.ijcai.org/papers07/Papers/IJCAI07-341.pdf}
}
[ pdf |
bib ]
|